+ INLINE_CODE: { pattern: /<code[^>]*>(.*?)<\/code>/gi, replacement: '`$1`' },
+ CODE_BLOCK: { pattern: /<pre[^>]*>(.*?)<\/pre>/gi, replacement: '```\n$1\n```' },
+
+ // Clean up
+ ANY_REMAINING_TAG: { pattern: /<[^>]*>/g, replacement: '' },
+ EXCESSIVE_NEWLINES: { pattern: /\n{3,}/g, replacement: '\n\n' }
+};
+
+/**
+ * HTML entity replacements
+ */
+export const HTML_ENTITY_REPLACEMENTS = {
+ // Common HTML entities
+ NBSP: { pattern: /&nbsp;/g, replacement: ' ' },
+ LT: { pattern: /&lt;/g, replacement: '<' },
+ GT: { pattern: /&gt;/g, replacement: '>' },
+ AMP: { pattern: /&amp;/g, replacement: '&' },
+ QUOT: { pattern: /&quot;/g, replacement: '"' },
+ APOS: { pattern: /&apos;/g, replacement: "'" },
+ LDQUO: { pattern: /&ldquo;/g, replacement: '"' },
+ RDQUO: { pattern: /&rdquo;/g, replacement: '"' },
+ LSQUO: { pattern: /&lsquo;/g, replacement: "'" },
+ RSQUO: { pattern: /&rsquo;/g, replacement: "'" },
+ MDASH: { pattern: /&mdash;/g, replacement: '—' },
+ NDASH: { pattern: /&ndash;/g, replacement: '–' },
+ HELLIP: { pattern: /&hellip;/g, replacement: '…' }
+};
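+
+// Usage sketch (hypothetical helper, not part of this module's exports): each
+// entry above is a { pattern, replacement } pair, so decoding entities is a
+// single pass over the table's values.
+function decodeHtmlEntities(text: string): string {
+ return Object.values(HTML_ENTITY_REPLACEMENTS).reduce(
+ (result, { pattern, replacement }) => result.replace(pattern, replacement),
+ text
+ );
+}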
+
+/**
+ * Encoding issue fixes
+ */
+export const ENCODING_FIXES = {
+ // Common encoding issues
+ BROKEN_QUOTES: { pattern: /Î\u00c2[\u00a3\u00a5]/g, replacement: '"' },
+
+ // Character replacements for Unicode
+ UNICODE_REPLACEMENTS: {
+ '\u00A0': ' ', // Non-breaking space
+ '\u2018': "'", // Left single quote
+ '\u2019': "'", // Right single quote
+ '\u201C': '"', // Left double quote
+ '\u201D': '"', // Right double quote
+ '\u2013': '-', // En dash
+ '\u2014': '--', // Em dash
+ '\u2022': '*', // Bullet
+ '\u2026': '...' // Ellipsis
+ }
+};
+
+/**
+ * Ollama-specific cleaning patterns
+ */
+export const OLLAMA_CLEANING = {
+ // Replace fancy quotes
+ QUOTES: { pattern: /[\u201C\u201D]/g, replacement: '"' },
+ APOSTROPHES: { pattern: /[\u2018\u2019]/g, replacement: "'" },
+
+ // Replace other Unicode characters
+ DASHES: { pattern: /[\u2013\u2014]/g, replacement: '-' },
+ BULLETS: { pattern: /[\u2022]/g, replacement: '*' },
+ ELLIPSES: { pattern: /[\u2026]/g, replacement: '...' },
+
+ // Remove non-ASCII characters
+ NON_ASCII: { pattern: /[^\x00-\x7F]/g, replacement: '' },
+
+ // Normalize whitespace
+ WHITESPACE: { pattern: /\s+/g, replacement: ' ' },
+ NEWLINE_WHITESPACE: { pattern: /\n\s+/g, replacement: '\n' }
+};
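+
+// Usage sketch (hypothetical helper): order matters here, since Unicode
+// punctuation should be normalized to ASCII before NON_ASCII strips whatever
+// remains, and whitespace is collapsed last.
+function cleanForOllama(text: string): string {
+ const { QUOTES, APOSTROPHES, DASHES, BULLETS, ELLIPSES, NON_ASCII, WHITESPACE } = OLLAMA_CLEANING;
+ return [QUOTES, APOSTROPHES, DASHES, BULLETS, ELLIPSES, NON_ASCII, WHITESPACE]
+ .reduce((result, { pattern, replacement }) => result.replace(pattern, replacement), text)
+ .trim();
+}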
+
+/**
+ * Console log messages for formatters
+ */
+export const FORMATTER_LOGS = {
+ ANTHROPIC: {
+ PROCESSED: (before: number, after: number) => `Anthropic formatter: ${before} messages → ${after} messages`
+ },
+ OPENAI: {
+ PROCESSED: (before: number, after: number) => `OpenAI formatter: ${before} messages → ${after} messages`
+ },
+ OLLAMA: {
+ PROCESSED: (before: number, after: number) => `Ollama formatter processed ${before} messages into ${after} messages`
+ },
+ ERROR: {
+ CONTEXT_CLEANING: (provider: string) => `Error cleaning content for ${provider}:`,
+ ENCODING: 'Error fixing encoding issues:'
+ }
+};
+
+/**
+ * Message formatter text templates
+ */
+export const MESSAGE_FORMATTER_TEMPLATES = {
+ /**
+ * OpenAI-specific message templates
+ */
+ OPENAI: {
+ CONTEXT_INSTRUCTION: 'Please use the following context to respond to the user\'s messages:\n\n'
+ },
+
+ /**
+ * Anthropic-specific message templates
+ */
+ ANTHROPIC: {
+ CONTEXT_START: '\n\n<context>\n',
+ CONTEXT_END: '\n</context>'
+ },
+
+ /**
+ * Ollama-specific message templates
+ */
+ OLLAMA: {
+ REFERENCE_INFORMATION: '\n\nReference information:\n'
+ },
+
+ /**
+ * Default formatter message templates
+ */
+ DEFAULT: {
+ CONTEXT_INSTRUCTION: 'Here is context to help you answer my questions: '
+ }
+};
+
+/**
+ * Provider identifier constants
+ */
+export const PROVIDER_IDENTIFIERS = {
+ OPENAI: 'openai',
+ ANTHROPIC: 'anthropic',
+ OLLAMA: 'ollama',
+ DEFAULT: 'default'
+};
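+
+// Usage sketch (hypothetical): PROVIDER_IDENTIFIERS keys the per-provider
+// templates above; Anthropic wraps context in a start/end pair, so only its
+// opening marker is returned here.
+function contextPrefixFor(provider: string): string {
+ switch (provider) {
+ case PROVIDER_IDENTIFIERS.OPENAI:
+ return MESSAGE_FORMATTER_TEMPLATES.OPENAI.CONTEXT_INSTRUCTION;
+ case PROVIDER_IDENTIFIERS.ANTHROPIC:
+ return MESSAGE_FORMATTER_TEMPLATES.ANTHROPIC.CONTEXT_START;
+ case PROVIDER_IDENTIFIERS.OLLAMA:
+ return MESSAGE_FORMATTER_TEMPLATES.OLLAMA.REFERENCE_INFORMATION;
+ default:
+ return MESSAGE_FORMATTER_TEMPLATES.DEFAULT.CONTEXT_INSTRUCTION;
+ }
+}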
diff --git a/src/services/llm/constants/hierarchy_constants.ts b/src/services/llm/constants/hierarchy_constants.ts
new file mode 100644
index 000000000..40cbedd1f
--- /dev/null
+++ b/src/services/llm/constants/hierarchy_constants.ts
@@ -0,0 +1,35 @@
+/**
+ * Hierarchy Context Constants
+ *
+ * This file centralizes all strings used in the note hierarchy context
+ * functionality. These strings are used when displaying information about parent-child
+ * relationships and note relations in the LLM context building process.
+ */
+
+export const HIERARCHY_STRINGS = {
+ // Parent context strings
+ PARENT_CONTEXT: {
+ NO_PARENT_CONTEXT: 'No parent context available.',
+ CURRENT_NOTE: (title: string) => `${title} (current note)`,
+ },
+
+ // Child context strings
+ CHILD_CONTEXT: {
+ NO_CHILD_NOTES: 'No child notes.',
+ CHILD_NOTES_HEADER: (count: number) => `Child notes (${count} total)`,
+ CHILD_SUMMARY_PREFIX: 'Summary: ',
+ MORE_CHILDREN: (count: number) => `... and ${count} more child notes not shown`,
+ ERROR_RETRIEVING: 'Error retrieving child notes.'
+ },
+
+ // Linked notes context strings
+ LINKED_NOTES: {
+ NO_LINKED_NOTES: 'No linked notes.',
+ OUTGOING_RELATIONS_HEADER: (count: number) => `Outgoing relations (${count} total)`,
+ INCOMING_RELATIONS_HEADER: (count: number) => `Incoming relations (${count} total)`,
+ DEFAULT_RELATION: 'relates to',
+ MORE_OUTGOING: (count: number) => `... and ${count} more outgoing relations not shown`,
+ MORE_INCOMING: (count: number) => `... and ${count} more incoming relations not shown`,
+ ERROR_RETRIEVING: 'Error retrieving linked notes.'
+ }
+};
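+
+// Usage sketch (the note shape here is a hypothetical minimal interface):
+// building a child-note listing with the templates above, truncating past a
+// display limit.
+function describeChildren(children: { title: string }[], limit = 5): string {
+ if (children.length === 0) {
+ return HIERARCHY_STRINGS.CHILD_CONTEXT.NO_CHILD_NOTES;
+ }
+ const lines = [HIERARCHY_STRINGS.CHILD_CONTEXT.CHILD_NOTES_HEADER(children.length)];
+ lines.push(...children.slice(0, limit).map(child => `- ${child.title}`));
+ if (children.length > limit) {
+ lines.push(HIERARCHY_STRINGS.CHILD_CONTEXT.MORE_CHILDREN(children.length - limit));
+ }
+ return lines.join('\n');
+}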
diff --git a/src/services/llm/constants/llm_prompt_constants.ts b/src/services/llm/constants/llm_prompt_constants.ts
new file mode 100644
index 000000000..68081f9c0
--- /dev/null
+++ b/src/services/llm/constants/llm_prompt_constants.ts
@@ -0,0 +1,298 @@
+/**
+ * LLM Prompt Constants
+ *
+ * This file centralizes all LLM/AI prompts used throughout the application.
+ * When adding new prompts, please add them here rather than hardcoding them in other files.
+ *
+ * Prompts are organized by their usage context (e.g., service, feature, etc.)
+ */
+
+import fs from 'fs';
+import path from 'path';
+import { fileURLToPath } from 'url';
+
+// Load system prompt from markdown file
+const loadSystemPrompt = (): string => {
+ try {
+ const __filename = fileURLToPath(import.meta.url);
+ const __dirname = path.dirname(__filename);
+
+ const promptPath = path.join(__dirname, '../prompts/base_system_prompt.md');
+ const promptContent = fs.readFileSync(promptPath, 'utf8');
+ // Strip the markdown title if needed
+ return promptContent.replace(/^# TriliumNext Base System Prompt\n+/, '');
+ } catch (error) {
+ console.error('Failed to load system prompt from file:', error);
+ // Return fallback prompt if file can't be loaded
+ return "You are a helpful assistant embedded in the TriliumNext Notes application. " +
+ "You can help users with their notes, answer questions, and provide information. " +
+ "Keep your responses concise and helpful. " +
+ "You're currently chatting with the user about their notes.";
+ }
+};
+
+// Base system prompt loaded from markdown file
+export const DEFAULT_SYSTEM_PROMPT = loadSystemPrompt();
+
+/**
+ * System prompts for different use cases
+ */
+export const SYSTEM_PROMPTS = {
+ DEFAULT_SYSTEM_PROMPT:
+ "You are an intelligent AI assistant for Trilium Notes, a hierarchical note-taking application. " +
+ "Help the user with their notes, knowledge management, and questions. " +
+ "When referencing their notes, be clear about which note you're referring to. " +
+ "Be concise but thorough in your responses.",
+
+ AGENT_TOOLS_PROMPT:
+ "You are an intelligent AI assistant for Trilium Notes with access to special tools. " +
+ "You can use these tools to search through the user's notes and find relevant information. " +
+ "Always be helpful, accurate, and respect the user's privacy and security.",
+
+ CONTEXT_AWARE_PROMPT:
+ "You are an intelligent AI assistant for Trilium Notes. " +
+ "You have access to the context from the user's notes. " +
+ "Use this context to provide accurate and helpful responses. " +
+ "Be specific when referencing information from their notes."
+};
+
+// Context-specific prompts
+export const CONTEXT_PROMPTS = {
+ // Query enhancer prompt for generating better search terms
+ QUERY_ENHANCER:
+ `You are an AI assistant that decides what information needs to be retrieved from a user's knowledge base called TriliumNext Notes to answer the user's question.
+Given the user's question, generate 3-5 specific search queries that would help find relevant information.
+Each query should be focused on a different aspect of the question.
+Avoid generating queries that are too broad, vague, or about a user's entire note database, and make sure they are relevant to the user's question.
+Format your answer as a JSON array of strings, with each string being a search query.
+Example: ["exact topic mentioned", "related concept 1", "related concept 2"]`,
+
+ // Used to format notes context when providing responses
+ CONTEXT_NOTES_WRAPPER:
+ `I'll provide you with relevant information from my notes to help answer your question.
+
+<notes>
+{noteContexts}
+</notes>
+
+When referring to information from these notes in your response, please cite them by their titles (e.g., "According to your note on [Title]...") rather than using labels like "Note 1" or "Note 2".
+
+Now, based on the above information, please answer: {query}`,
+
+ // Default fallback when no notes are found
+ NO_NOTES_CONTEXT:
+ "I am an AI assistant helping you with your Trilium notes. " +
+ "I couldn't find any specific notes related to your query, but I'll try to assist you " +
+ "with general knowledge about Trilium or other topics you're interested in.",
+
+ // Fallback when context building fails
+ ERROR_FALLBACK_CONTEXT:
+ "I'm your AI assistant helping with your Trilium notes. I'll try to answer based on what I know.",
+
+ // Headers for context (by provider)
+ CONTEXT_HEADERS: {
+ ANTHROPIC: (query: string) =>
+ `I'm your AI assistant helping with your Trilium notes database. For your query: "${query}", I found these relevant <notes>`,
+ DEFAULT: (query: string) =>
+ `I've found some relevant information in your notes that may help answer: "${query}"\n\n`
+ },
+
+ // Closings for context (by provider)
+ CONTEXT_CLOSINGS: {
+ ANTHROPIC:
+ "\n\nPlease use this information to answer the user's query. If the notes don't contain enough information, you can use your general knowledge as well.",
+ DEFAULT:
+ "\n\nBased on this information from the user's notes, please provide a helpful response."
+ },
+
+ // Context for index service
+ INDEX_NO_NOTES_CONTEXT:
+ "I'm an AI assistant helping with your Trilium notes. I couldn't find specific notes related to your query, but I'll try to assist based on general knowledge.",
+
+ // Prompt for adding note context to chat
+ NOTE_CONTEXT_PROMPT: `Here is the content of the note I want to discuss:
+
+<note_content>
+{context}
+</note_content>
+
+Please help me with this information.`,
+
+ // Prompt for adding semantic note context to chat
+ SEMANTIC_NOTE_CONTEXT_PROMPT: `Here is the relevant information from my notes based on my query "{query}":
+
+<context>
+{context}
+</context>
+
+Please help me understand this information in relation to my query.`,
+
+ // System message prompt for context-aware chat
+ CONTEXT_AWARE_SYSTEM_PROMPT: `You are an AI assistant helping with Trilium Notes. Use this context to answer the user's question:
+
+<context>
+{enhancedContext}
+</context>`,
+
+ // Error messages
+ ERROR_MESSAGES: {
+ GENERAL_ERROR: `Error: Failed to generate response. {errorMessage}`,
+ CONTEXT_ERROR: `Error: Failed to generate response with note context. {errorMessage}`
+ },
+
+ // Merged from JS file
+ AGENT_TOOLS_CONTEXT_PROMPT:
+ "You have access to the following tools to help answer the user's question: {tools}"
+};
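+
+// Usage sketch (hypothetical helper): several of the templates above carry
+// {placeholder} slots rather than being template literals, so callers are
+// assumed to fill them with a substitution like this:
+function fillPromptTemplate(template: string, values: Record<string, string>): string {
+ return Object.entries(values).reduce(
+ (result, [key, value]) => result.split(`{${key}}`).join(value),
+ template
+ );
+}
+// e.g. fillPromptTemplate(CONTEXT_PROMPTS.CONTEXT_NOTES_WRAPPER, { noteContexts, query })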
+
+// Agent tool prompts
+export const AGENT_TOOL_PROMPTS = {
+ // Prompts for query decomposition
+ QUERY_DECOMPOSITION: {
+ SUB_QUERY_DIRECT: 'Direct question that can be answered without decomposition',
+ SUB_QUERY_GENERIC: 'Generic exploration to find related content',
+ SUB_QUERY_ERROR: 'Error in decomposition, treating as simple query',
+ SUB_QUERY_DIRECT_ANALYSIS: 'Direct analysis of note details',
+ ORIGINAL_QUERY: 'Original query'
+ },
+
+ // Prompts for contextual thinking tool
+ CONTEXTUAL_THINKING: {
+ STARTING_ANALYSIS: (query: string) => `Starting analysis of the query: "${query}"`,
+ KEY_COMPONENTS: 'What are the key components of this query that need to be addressed?',
+ BREAKING_DOWN: 'Breaking down the query to understand its requirements and context.'
+ }
+};
+
+// Provider-specific prompt modifiers
+export const PROVIDER_PROMPTS = {
+ ANTHROPIC: {
+ // Anthropic Claude-specific prompt formatting
+ SYSTEM_WITH_CONTEXT: (context: string) =>
+ `
+${DEFAULT_SYSTEM_PROMPT}
+
+Use the following information from the user's notes to answer their questions:
+
+<notes>
+${context}
+</notes>
+
+When responding:
+- Focus on the most relevant information from the notes
+- Be concise and direct in your answers
+- If quoting from notes, mention which note it's from
+- If the notes don't contain relevant information, say so clearly
+`,
+
+ INSTRUCTIONS_WRAPPER: (instructions: string) =>
+ `<instructions>\n${instructions}\n</instructions>`,
+
+ ACKNOWLEDGMENT: "I understand. I'll follow those instructions.",
+ CONTEXT_ACKNOWLEDGMENT: "I'll help you with your notes based on the context provided.",
+ CONTEXT_QUERY_ACKNOWLEDGMENT: "I'll help you with your notes based on the context provided. What would you like to know?"
+ },
+
+ OPENAI: {
+ // OpenAI-specific prompt formatting
+ SYSTEM_WITH_CONTEXT: (context: string) =>
+ `
+You are an AI assistant integrated into TriliumNext Notes.
+Use the following information from the user's notes to answer their questions:
+
+<notes>
+${context}
+</notes>
+
+Focus on relevant information from these notes when answering.
+Be concise and informative in your responses.
+`
+ },
+
+ OLLAMA: {
+ // Ollama-specific prompt formatting
+ CONTEXT_INJECTION: (context: string, query: string) =>
+ `Here's information from my notes to help answer the question:
+
+${context}
+
+Based on this information, please answer: ${query}`
+ },
+
+ // Common prompts across providers
+ COMMON: {
+ DEFAULT_ASSISTANT_INTRO: "You are an AI assistant integrated into TriliumNext Notes. Focus on helping users find information in their notes and answering questions based on their knowledge base. Be concise, informative, and direct when responding to queries."
+ }
+};
+
+// Constants for formatting context and messages
+export const FORMATTING_PROMPTS = {
+ // Headers for context formatting
+ CONTEXT_HEADERS: {
+ SIMPLE: (query: string) => `I'm searching for information about: ${query}\n\nHere are the most relevant notes from my knowledge base:`,
+ DETAILED: (query: string) => `I'm searching for information about: "${query}"\n\nHere are the most relevant notes from my personal knowledge base:`
+ },
+
+ // Closing text for context formatting
+ CONTEXT_CLOSERS: {
+ SIMPLE: `\nEnd of notes. Please use this information to answer my question comprehensively.`,
+ DETAILED: `\nEnd of context information. Please use only the above notes to answer my question as comprehensively as possible.`
+ },
+
+ // Dividers used in context formatting
+ DIVIDERS: {
+ NOTE_SECTION: `------ NOTE INFORMATION ------`,
+ CONTENT_SECTION: `------ CONTEXT INFORMATION ------`,
+ NOTE_START: `# Note: `,
+ CONTENT_START: `Content: `
+ },
+
+ HTML_ALLOWED_TAGS: ['b', 'i', 'em', 'strong', 'a', 'p', 'br', 'ul', 'ol', 'li', 'h1', 'h2', 'h3', 'h4', 'h5', 'code', 'pre']
+};
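+
+// Usage sketch (hypothetical helper): assembling a single note block with the
+// dividers above.
+function formatNoteForContext(title: string, content: string): string {
+ const { DIVIDERS } = FORMATTING_PROMPTS;
+ return [
+ DIVIDERS.NOTE_SECTION,
+ DIVIDERS.NOTE_START + title,
+ DIVIDERS.CONTENT_START + content
+ ].join('\n');
+}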
+
+// Prompt templates for chat service
+export const CHAT_PROMPTS = {
+ // Introduction messages for new chats
+ INTRODUCTIONS: {
+ NEW_CHAT: "Welcome to TriliumNext AI Assistant. How can I help you with your notes today?",
+ SEMANTIC_SEARCH: "I'll search through your notes for relevant information. What would you like to know?"
+ },
+
+ // Placeholders for various chat scenarios
+ PLACEHOLDERS: {
+ NO_CONTEXT: "I don't have any specific note context yet. Would you like me to search your notes for something specific?",
+ WAITING_FOR_QUERY: "Awaiting your question..."
+ }
+};
+
+// Error messages and fallbacks
+export const ERROR_PROMPTS = {
+ // User-facing error messages
+ USER_ERRORS: {
+ GENERAL_ERROR: "I encountered an error processing your request. Please try again or rephrase your question.",
+ CONTEXT_ERROR: "I couldn't retrieve context from your notes. Please check your query or try a different question.",
+ NETWORK_ERROR: "There was a network error connecting to the AI service. Please check your connection and try again.",
+ RATE_LIMIT: "The AI service is currently experiencing high demand. Please try again in a moment.",
+
+ // Merged from JS file
+ PROVIDER_ERROR:
+ "I'm sorry, but there seems to be an issue with the AI service provider. " +
+ "Please check your connection and API settings, or try again later."
+ },
+
+ // Internal error handling
+ INTERNAL_ERRORS: {
+ CONTEXT_PROCESSING: "Error processing context data",
+ MESSAGE_FORMATTING: "Error formatting messages for LLM",
+ RESPONSE_PARSING: "Error parsing LLM response"
+ },
+
+ // Merged from JS file
+ SYSTEM_ERRORS: {
+ NO_PROVIDER_AVAILABLE:
+ "No AI provider is available. Please check your AI settings and ensure at least one provider is configured properly.",
+
+ UNAUTHORIZED:
+ "The AI provider returned an authorization error. Please check your API key settings."
+ }
+};
diff --git a/src/services/llm/constants/provider_constants.ts b/src/services/llm/constants/provider_constants.ts
new file mode 100644
index 000000000..e1cccecc6
--- /dev/null
+++ b/src/services/llm/constants/provider_constants.ts
@@ -0,0 +1,215 @@
+export const PROVIDER_CONSTANTS = {
+ ANTHROPIC: {
+ API_VERSION: '2023-06-01',
+ BETA_VERSION: 'messages-2023-12-15',
+ BASE_URL: 'https://api.anthropic.com',
+ DEFAULT_MODEL: 'claude-3-haiku-20240307',
+ // Model mapping for simplified model names to their full versions
+ MODEL_MAPPING: {
+ 'claude-3.7-sonnet': 'claude-3-7-sonnet-20250219',
+ 'claude-3.5-sonnet': 'claude-3-5-sonnet-20241022',
+ 'claude-3.5-haiku': 'claude-3-5-haiku-20241022',
+ 'claude-3-opus': 'claude-3-opus-20240229',
+ 'claude-3-sonnet': 'claude-3-sonnet-20240229',
+ 'claude-3-haiku': 'claude-3-haiku-20240307',
+ 'claude-2': 'claude-2.1'
+ },
+ // These are the currently available models from Anthropic
+ AVAILABLE_MODELS: [
+ {
+ id: 'claude-3-7-sonnet-20250219',
+ name: 'Claude 3.7 Sonnet',
+ description: 'Most intelligent model with hybrid reasoning capabilities',
+ maxTokens: 8192
+ },
+ {
+ id: 'claude-3-5-sonnet-20241022',
+ name: 'Claude 3.5 Sonnet',
+ description: 'High level of intelligence and capability',
+ maxTokens: 8192
+ },
+ {
+ id: 'claude-3-5-haiku-20241022',
+ name: 'Claude 3.5 Haiku',
+ description: 'Fastest model with high intelligence',
+ maxTokens: 8192
+ },
+ {
+ id: 'claude-3-opus-20240229',
+ name: 'Claude 3 Opus',
+ description: 'Most capable model for highly complex tasks',
+ maxTokens: 8192
+ },
+ {
+ id: 'claude-3-sonnet-20240229',
+ name: 'Claude 3 Sonnet',
+ description: 'Ideal balance of intelligence and speed',
+ maxTokens: 8192
+ },
+ {
+ id: 'claude-3-haiku-20240307',
+ name: 'Claude 3 Haiku',
+ description: 'Fastest and most compact model',
+ maxTokens: 8192
+ },
+ {
+ id: 'claude-2.1',
+ name: 'Claude 2.1',
+ description: 'Previous generation model',
+ maxTokens: 8192
+ }
+ ]
+ },
+
+ OPENAI: {
+ BASE_URL: 'https://api.openai.com/v1',
+ DEFAULT_MODEL: 'gpt-3.5-turbo',
+ DEFAULT_EMBEDDING_MODEL: 'text-embedding-ada-002',
+ CONTEXT_WINDOW: 16000,
+ EMBEDDING_DIMENSIONS: {
+ ADA: 1536,
+ DEFAULT: 1536
+ },
+ AVAILABLE_MODELS: [
+ {
+ id: 'gpt-4o',
+ name: 'GPT-4o',
+ description: 'Most capable multimodal model',
+ maxTokens: 8192
+ },
+ {
+ id: 'gpt-4-turbo',
+ name: 'GPT-4 Turbo',
+ description: 'Advanced capabilities with higher token limit',
+ maxTokens: 8192
+ },
+ {
+ id: 'gpt-4',
+ name: 'GPT-4',
+ description: 'Original GPT-4 model',
+ maxTokens: 8192
+ },
+ {
+ id: 'gpt-3.5-turbo',
+ name: 'GPT-3.5 Turbo',
+ description: 'Fast and efficient model for most tasks',
+ maxTokens: 8192
+ }
+ ]
+ },
+
+ OLLAMA: {
+ BASE_URL: 'http://localhost:11434',
+ DEFAULT_MODEL: 'llama2',
+ BATCH_SIZE: 100,
+ CHUNKING: {
+ SIZE: 4000,
+ OVERLAP: 200
+ },
+ MODEL_DIMENSIONS: {
+ default: 8192,
+ llama2: 8192,
+ mixtral: 8192,
+ mistral: 8192
+ },
+ MODEL_CONTEXT_WINDOWS: {
+ default: 8192,
+ llama2: 8192,
+ mixtral: 8192,
+ mistral: 8192
+ }
+ }
+} as const;
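+
+// Usage sketch (hypothetical): MODEL_MAPPING lets callers pass a simplified
+// Anthropic model name and still get a pinned version; unknown names pass
+// through unchanged so full version strings keep working.
+function resolveAnthropicModel(requested?: string): string {
+ const { MODEL_MAPPING, DEFAULT_MODEL } = PROVIDER_CONSTANTS.ANTHROPIC;
+ if (!requested) {
+ return DEFAULT_MODEL;
+ }
+ return (MODEL_MAPPING as Record<string, string>)[requested] ?? requested;
+}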
+
+// LLM service configuration constants
+export const LLM_CONSTANTS = {
+ // Context window sizes (in characters)
+ CONTEXT_WINDOW: {
+ OLLAMA: 8000,
+ OPENAI: 12000,
+ ANTHROPIC: 15000,
+ VOYAGE: 12000,
+ DEFAULT: 6000
+ },
+
+ // Embedding dimensions (verify these with your actual models)
+ EMBEDDING_DIMENSIONS: {
+ OLLAMA: {
+ DEFAULT: 384,
+ NOMIC: 768,
+ MISTRAL: 1024
+ },
+ OPENAI: {
+ ADA: 1536,
+ DEFAULT: 1536
+ },
+ ANTHROPIC: {
+ CLAUDE: 1024,
+ DEFAULT: 1024
+ },
+ VOYAGE: {
+ DEFAULT: 1024
+ }
+ },
+
+ // Model-specific embedding dimensions for Ollama models
+ OLLAMA_MODEL_DIMENSIONS: {
+ "llama3": 8192,
+ "llama3.1": 8192,
+ "mistral": 8192,
+ "nomic": 768,
+ "mxbai": 1024,
+ "nomic-embed-text": 768,
+ "mxbai-embed-large": 1024,
+ "default": 384
+ },
+
+ // Model-specific context windows for Ollama models
+ OLLAMA_MODEL_CONTEXT_WINDOWS: {
+ "llama3": 8192,
+ "llama3.1": 8192,
+ "llama3.2": 8192,
+ "mistral": 8192,
+ "nomic": 32768,
+ "mxbai": 32768,
+ "nomic-embed-text": 32768,
+ "mxbai-embed-large": 32768,
+ "default": 8192
+ },
+
+ // Batch size configuration
+ BATCH_SIZE: {
+ OPENAI: 10, // OpenAI can handle larger batches efficiently
+ ANTHROPIC: 5, // More conservative for Anthropic
+ OLLAMA: 1, // Ollama processes one at a time
+ DEFAULT: 5 // Conservative default
+ },
+
+ // Chunking parameters
+ CHUNKING: {
+ DEFAULT_SIZE: 1500,
+ OLLAMA_SIZE: 1000,
+ DEFAULT_OVERLAP: 100,
+ MAX_SIZE_FOR_SINGLE_EMBEDDING: 5000
+ },
+
+ // Search/similarity thresholds
+ SIMILARITY: {
+ DEFAULT_THRESHOLD: 0.65,
+ HIGH_THRESHOLD: 0.75,
+ LOW_THRESHOLD: 0.5
+ },
+
+ // Session management
+ SESSION: {
+ CLEANUP_INTERVAL_MS: 60 * 60 * 1000, // 1 hour
+ SESSION_EXPIRY_MS: 12 * 60 * 60 * 1000, // 12 hours
+ MAX_SESSION_MESSAGES: 10
+ },
+
+ // Content limits
+ CONTENT: {
+ MAX_NOTE_CONTENT_LENGTH: 1500,
+ MAX_TOTAL_CONTENT_LENGTH: 10000
+ }
+};
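+
+// Usage sketch (hypothetical): Ollama model names often carry tags such as
+// "llama3.1:8b", so a longest-prefix match against the table keys is assumed
+// here before falling back to the default entry.
+function ollamaContextWindow(modelName: string): number {
+ const windows: Record<string, number> = LLM_CONSTANTS.OLLAMA_MODEL_CONTEXT_WINDOWS;
+ const key = Object.keys(windows)
+ .filter(k => k !== 'default')
+ .sort((a, b) => b.length - a.length)
+ .find(k => modelName.startsWith(k));
+ return key ? windows[key] : windows['default'];
+}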
diff --git a/src/services/llm/constants/query_decomposition_constants.ts b/src/services/llm/constants/query_decomposition_constants.ts
new file mode 100644
index 000000000..2c6df4386
--- /dev/null
+++ b/src/services/llm/constants/query_decomposition_constants.ts
@@ -0,0 +1,95 @@
+/**
+ * Query Decomposition Constants
+ *
+ * This file centralizes all string constants used in the query decomposition tool.
+ * These constants can be translated for internationalization support.
+ */
+
+export const QUERY_DECOMPOSITION_STRINGS = {
+ // Log messages
+ LOG_MESSAGES: {
+ DECOMPOSING_QUERY: (query: string) => `Decomposing query: "${query.substring(0, 100)}..."`,
+ EMPTY_QUERY: "Query decomposition called with empty query",
+ COMPLEXITY_ASSESSMENT: (complexity: number) => `Query complexity assessment: ${complexity}/10`,
+ SIMPLE_QUERY: (complexity: number) => `Query is simple (complexity ${complexity}), returning as single sub-query`,
+ DECOMPOSED_INTO: (count: number) => `Decomposed query into ${count} sub-queries`,
+ SUB_QUERY_LOG: (index: number, text: string, reason: string) => `Sub-query ${index + 1}: "${text}" - Reason: ${reason}`,
+ ERROR_DECOMPOSING: (error: string) => `Error decomposing query: ${error}`,
+ AVOIDING_RECURSIVE: (query: string) => `Avoiding recursive subqueries for query "${query.substring(0, 50)}..."`,
+ ERROR_SYNTHESIZING: (error: string) => `Error synthesizing answer: ${error}`
+ },
+
+ // Query identification patterns
+ QUERY_PATTERNS: {
+ PROVIDE_DETAILS_ABOUT: "provide details about",
+ INFORMATION_RELATED_TO: "information related to",
+ COMPARE: "compare",
+ DIFFERENCE_BETWEEN: "difference between",
+ VS: " vs ",
+ VERSUS: "versus",
+ HOW_TO: "how to ",
+ WHY: "why ",
+ WHAT_IS: "what is ",
+ WHAT_ARE: "what are "
+ },
+
+ // Question words used for complexity assessment
+ QUESTION_WORDS: ['what', 'how', 'why', 'where', 'when', 'who', 'which'],
+
+ // Conjunctions used for complexity assessment
+ CONJUNCTIONS: ['and', 'or', 'but', 'as well as'],
+
+ // Comparison terms used for complexity assessment
+ COMPARISON_TERMS: ['compare', 'versus', 'vs', 'difference', 'similarities'],
+
+ // Analysis terms used for complexity assessment
+ ANALYSIS_TERMS: ['analyze', 'examine', 'investigate', 'explore', 'explain', 'discuss'],
+
+ // Common stop words for parsing
+ STOP_WORDS: ['the', 'of', 'and', 'or', 'vs', 'versus', 'between', 'comparison', 'compared', 'to', 'with', 'what', 'is', 'are', 'how', 'why', 'when', 'which'],
+
+ // Sub-query templates
+ SUB_QUERY_TEMPLATES: {
+ INFORMATION_RELATED: (query: string) => `Information related to ${query}`,
+ KEY_CHARACTERISTICS: (entity: string) => `What are the key characteristics of ${entity}?`,
+ COMPARISON_FEATURES: (entities: string[]) => `How do ${entities.join(' and ')} compare in terms of their primary features?`,
+ STEPS_TO: (topic: string) => `What are the steps to ${topic}?`,
+ CHALLENGES: (topic: string) => `What are common challenges or pitfalls when trying to ${topic}?`,
+ CAUSES: (topic: string) => `What are the causes of ${topic}?`,
+ EVIDENCE: (topic: string) => `What evidence supports explanations for ${topic}?`,
+ DEFINITION: (topic: string) => `Definition of ${topic}`,
+ EXAMPLES: (topic: string) => `Examples of ${topic}`,
+ KEY_INFORMATION: (concept: string) => `Key information about ${concept}`
+ },
+
+ // Sub-query reasons
+ SUB_QUERY_REASONS: {
+ GETTING_DETAILS: (entity: string) => `Getting details about "${entity}" for comparison`,
+ DIRECT_COMPARISON: 'Direct comparison of the entities',
+ FINDING_PROCEDURAL: 'Finding procedural information',
+ IDENTIFYING_DIFFICULTIES: 'Identifying potential difficulties',
+ IDENTIFYING_CAUSES: 'Identifying causes',
+ FINDING_EVIDENCE: 'Finding supporting evidence',
+ GETTING_DEFINITION: 'Getting basic definition',
+ FINDING_EXAMPLES: 'Finding examples',
+ FINDING_INFORMATION: (concept: string) => `Finding information about "${concept}"`
+ },
+
+ // Synthesis answer templates
+ SYNTHESIS_TEMPLATES: {
+ CANNOT_SYNTHESIZE: "Cannot synthesize answer - not all sub-queries have been answered.",
+ ANSWER_TO: (query: string) => `Answer to: "${query}"\n\n`,
+ BASED_ON_INFORMATION: "Based on the information gathered:\n\n",
+ ERROR_SYNTHESIZING: "Error synthesizing the final answer."
+ },
+
+ // Query status templates
+ STATUS_TEMPLATES: {
+ PROGRESS: (answered: number, total: number) => `Progress: ${answered}/${total} sub-queries answered\n\n`,
+ ANSWERED_MARKER: "✓",
+ UNANSWERED_MARKER: "✗",
+ ANSWER_PREFIX: " Answer: "
+ }
+};
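+
+// Usage sketch (the sub-query shape is a hypothetical minimal interface):
+// rendering decomposition progress with the status templates above.
+interface SubQueryStatus { text: string; answer?: string; }
+function renderProgress(query: string, subQueries: SubQueryStatus[]): string {
+ const { STATUS_TEMPLATES, SYNTHESIS_TEMPLATES } = QUERY_DECOMPOSITION_STRINGS;
+ const answered = subQueries.filter(sq => sq.answer !== undefined).length;
+ let report = SYNTHESIS_TEMPLATES.ANSWER_TO(query)
+ + STATUS_TEMPLATES.PROGRESS(answered, subQueries.length);
+ for (const sq of subQueries) {
+ const marker = sq.answer !== undefined ? STATUS_TEMPLATES.ANSWERED_MARKER : STATUS_TEMPLATES.UNANSWERED_MARKER;
+ report += `${marker} ${sq.text}\n`;
+ if (sq.answer !== undefined) {
+ report += STATUS_TEMPLATES.ANSWER_PREFIX + sq.answer + '\n';
+ }
+ }
+ return report;
+}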
+
+export default QUERY_DECOMPOSITION_STRINGS;
diff --git a/src/services/llm/constants/search_constants.ts b/src/services/llm/constants/search_constants.ts
new file mode 100644
index 000000000..bc1689961
--- /dev/null
+++ b/src/services/llm/constants/search_constants.ts
@@ -0,0 +1,137 @@
+export const SEARCH_CONSTANTS = {
+ // Vector search parameters
+ VECTOR_SEARCH: {
+ DEFAULT_MAX_RESULTS: 10,
+ DEFAULT_THRESHOLD: 0.6,
+ SIMILARITY_THRESHOLD: {
+ COSINE: 0.6,
+ HYBRID: 0.3,
+ DIM_AWARE: 0.1
+ },
+ EXACT_MATCH_THRESHOLD: 0.65
+ },
+
+ // Context extraction parameters
+ CONTEXT: {
+ CONTENT_LENGTH: {
+ MEDIUM_THRESHOLD: 5000,
+ HIGH_THRESHOLD: 10000
+ },
+ MAX_PARENT_DEPTH: 3,
+ MAX_CHILDREN: 10,
+ MAX_LINKS: 10,
+ MAX_SIMILAR_NOTES: 5,
+ MAX_CONTENT_LENGTH: 2000,
+ MAX_RELATIONS: 10,
+ MAX_POINTS: 5
+ },
+
+ // Hierarchy parameters
+ HIERARCHY: {
+ DEFAULT_QUERY_DEPTH: 2,
+ MAX_NOTES_PER_QUERY: 10,
+ MAX_PATH_LENGTH: 20,
+ MAX_BREADTH: 100,
+ MAX_DEPTH: 5,
+ MAX_PATHS_TO_SHOW: 3
+ },
+
+ // Temperature settings
+ TEMPERATURE: {
+ DEFAULT: 0.7,
+ RELATIONSHIP_TOOL: 0.4,
+ VECTOR_SEARCH: 0.3,
+ QUERY_PROCESSOR: 0.3
+ },
+
+ // Token/char limits
+ LIMITS: {
+ DEFAULT_NOTE_SUMMARY_LENGTH: 500,
+ DEFAULT_MAX_TOKENS: 4096,
+ RELATIONSHIP_TOOL_MAX_TOKENS: 50,
+ VECTOR_SEARCH_MAX_TOKENS: 500,
+ QUERY_PROCESSOR_MAX_TOKENS: 300,
+ MIN_STRING_LENGTH: 3
+ },
+
+ // Tool execution parameters
+ TOOL_EXECUTION: {
+ MAX_TOOL_CALL_ITERATIONS: 5,
+ MAX_FOLLOW_UP_ITERATIONS: 3
+ }
+};
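+
+// Usage sketch (the result shape is a hypothetical minimal interface):
+// filtering vector-search hits by the default similarity threshold and
+// capping the result count.
+interface ScoredNote { noteId: string; similarity: number; }
+function topMatches(results: ScoredNote[]): ScoredNote[] {
+ const { DEFAULT_THRESHOLD, DEFAULT_MAX_RESULTS } = SEARCH_CONSTANTS.VECTOR_SEARCH;
+ return results
+ .filter(r => r.similarity >= DEFAULT_THRESHOLD)
+ .sort((a, b) => b.similarity - a.similarity)
+ .slice(0, DEFAULT_MAX_RESULTS);
+}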
+
+// Model capabilities constants - moved from ./interfaces/model_capabilities.ts
+export const MODEL_CAPABILITIES = {
+ 'gpt-3.5-turbo': {
+ contextWindowTokens: 8192,
+ contextWindowChars: 16000
+ },
+ 'gpt-4': {
+ contextWindowTokens: 8192
+ },
+ 'gpt-4-turbo': {
+ contextWindowTokens: 8192
+ },
+ 'claude-3-opus': {
+ contextWindowTokens: 200000
+ },
+ 'claude-3-sonnet': {
+ contextWindowTokens: 180000
+ },
+ 'claude-3.5-sonnet': {
+ contextWindowTokens: 200000
+ },
+ 'default': {
+ contextWindowTokens: 4096
+ }
+};
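+
+// Usage sketch (hypothetical): unknown model names fall back to the
+// conservative 'default' entry.
+function contextWindowTokensFor(modelName: string): number {
+ const caps = (MODEL_CAPABILITIES as Record<string, { contextWindowTokens: number }>)[modelName]
+ ?? MODEL_CAPABILITIES['default'];
+ return caps.contextWindowTokens;
+}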
+
+// Embedding processing constants
+export const EMBEDDING_PROCESSING = {
+ MAX_TOTAL_PROCESSING_TIME: 5 * 60 * 1000, // 5 minutes
+ MAX_CHUNK_RETRY_ATTEMPTS: 2,
+ DEFAULT_MAX_CHUNK_PROCESSING_TIME: 60 * 1000, // 1 minute
+ OLLAMA_MAX_CHUNK_PROCESSING_TIME: 120 * 1000, // 2 minutes
+ DEFAULT_EMBEDDING_UPDATE_INTERVAL: 200
+};
+
+// Provider-specific embedding capabilities
+export const PROVIDER_EMBEDDING_CAPABILITIES = {
+ VOYAGE: {
+ MODELS: {
+ 'voyage-large-2': {
+ contextWidth: 8192,
+ dimension: 1536
+ },
+ 'voyage-2': {
+ contextWidth: 8192,
+ dimension: 1024
+ },
+ 'voyage-lite-02': {
+ contextWidth: 8192,
+ dimension: 768
+ },
+ 'default': {
+ contextWidth: 8192,
+ dimension: 1024
+ }
+ }
+ },
+ OPENAI: {
+ MODELS: {
+ 'text-embedding-3-small': {
+ dimension: 1536,
+ contextWindow: 8191
+ },
+ 'text-embedding-3-large': {
+ dimension: 3072,
+ contextWindow: 8191
+ },
+ 'default': {
+ dimension: 1536,
+ contextWindow: 8192
+ }
+ }
+ }
+};
diff --git a/src/services/llm/context/code_handlers.ts b/src/services/llm/context/code_handlers.ts
new file mode 100644
index 000000000..f4b1fca97
--- /dev/null
+++ b/src/services/llm/context/code_handlers.ts
@@ -0,0 +1,438 @@
+/**
+ * Helper functions for processing code notes, including language detection and structure extraction
+ */
+
+// Import highlight.js dynamically when needed
+let hljs: object | null = null;
+
+/**
+ * Attempt to detect the programming language from code content or note attributes
+ */
+export function detectLanguage(content: string, mime: string): string {
+ // First check MIME type for hints
+ if (mime) {
+ const mimeLower = mime.toLowerCase();
+
+ // Map of mime types to language names
+ const mimeMap: {[key: string]: string} = {
+ 'text/javascript': 'javascript',
+ 'application/javascript': 'javascript',
+ 'text/typescript': 'typescript',
+ 'application/typescript': 'typescript',
+ 'text/x-python': 'python',
+ 'text/x-java': 'java',
+ 'text/x-c': 'c',
+ 'text/x-c++': 'cpp',
+ 'text/x-csharp': 'csharp',
+ 'text/x-go': 'go',
+ 'text/x-ruby': 'ruby',
+ 'text/x-php': 'php',
+ 'text/x-rust': 'rust',
+ 'text/x-swift': 'swift',
+ 'text/x-kotlin': 'kotlin',
+ 'text/x-scala': 'scala',
+ 'text/x-perl': 'perl',
+ 'text/x-lua': 'lua',
+ 'text/x-r': 'r',
+ 'text/x-dart': 'dart',
+ 'text/html': 'html',
+ 'text/css': 'css',
+ 'application/json': 'json',
+ 'application/xml': 'xml',
+ 'text/markdown': 'markdown',
+ 'text/yaml': 'yaml',
+ 'text/x-sql': 'sql'
+ };
+
+ if (mimeMap[mimeLower]) {
+ return mimeMap[mimeLower];
+ }
+ }
+
+ // Fall back to pattern-based detection: check for common language
+ // signatures in the first few lines
+ const firstLines = content.split('\n').slice(0, 10).join('\n');
+
+ // Simple heuristics for common languages
+ if (firstLines.includes('<!DOCTYPE') || firstLines.includes('<html')) return 'html';
+ if (firstLines.includes('function ') && firstLines.includes('var ') && firstLines.includes('const ')) return 'javascript';
+ if (firstLines.includes('interface ') && firstLines.includes('export class ')) return 'typescript';
+ if (firstLines.includes('@Component') || firstLines.includes('import { Component }')) return 'typescript';
+
+ // Default to 'text' if language can't be determined
+ return 'text';
+}
+
+/**
+ * Extract structure from code to create a summary
+ */
+export function extractCodeStructure(content: string, language: string): string {
+ // Avoid processing very large code files
+ if (content.length > 100000) {
+ return "Code content too large for structure extraction";
+ }
+
+ let structure = "";
+
+ try {
+ switch (language.toLowerCase()) {
+ case 'javascript':
+ case 'typescript':
+ structure = extractJsStructure(content);
+ break;
+
+ case 'python':
+ structure = extractPythonStructure(content);
+ break;
+
+ case 'java':
+ case 'csharp':
+ case 'cpp':
+ structure = extractClassBasedStructure(content);
+ break;
+
+ case 'go':
+ structure = extractGoStructure(content);
+ break;
+
+ case 'rust':
+ structure = extractRustStructure(content);
+ break;
+
+ case 'html':
+ structure = extractHtmlStructure(content);
+ break;
+
+ default:
+ // For other languages, just return a summary of the file size and a few lines
+ const lines = content.split('\n');
+ structure = `Code file with ${lines.length} lines.\n`;
+
+ // Add first few non-empty lines that aren't comments
+ const firstCodeLines = lines.filter(line =>
+ line.trim() !== '' &&
+ !line.trim().startsWith('//') &&
+ !line.trim().startsWith('#') &&
+ !line.trim().startsWith('*') &&
+ !line.trim().startsWith('