docker
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 1 deletion b/‎.gitignore‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎README.md‎
Lines changed: 85 additions & 0 deletions b/‎README.md‎
Lines changed: 85 additions & 0 deletions
diff --git a/‎cagent-schema.json‎
Lines changed: 193 additions & 0 deletions b/‎cagent-schema.json‎
Lines changed: 193 additions & 0 deletions
diff --git a/‎cmd/root/new.go‎
Lines changed: 1 addition & 1 deletion b/‎cmd/root/new.go‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎cmd/root/run.go‎
Lines changed: 1 addition & 1 deletion b/‎cmd/root/run.go‎
Lines changed: 1 addition & 1 deletion
@@ -3,10 +3,11 @@ dist
 .task
 .DS_Store
 evals
-*.db
+*.db*
 /cagent
 .crush
 .vscode
+*.debug
 
 # agents
 agent.yaml
 
@@ -145,6 +145,8 @@ See [MCP Mode documentation](./docs/MCP-MODE.md) for detailed instructions on ex
 - **📝 YAML configuration** - Declarative model and agent configuration.
 - **💭 Advanced reasoning** - Built-in "think", "todo" and "memory" tools for
   complex problem-solving.
+- **🔍 RAG (Retrieval-Augmented Generation)** - Pluggable retrieval strategies
+  (chunked-embeddings, BM25, and more to come) with hybrid retrieval and fusion support.
 - **🌐 Multiple AI providers** - Support for OpenAI, Anthropic, Gemini, xAI,
   Mistral, Nebius and [Docker Model
   Runner](https://docs.docker.com/ai/model-runner/).
@@ -292,6 +294,89 @@ Linux](https://docs.docker.com/ai/model-runner/get-started/#enable-dmr-in-docker
 
 See the [DMR Provider documentation](docs/USAGE.md#dmr-docker-model-runner-provider-usage) for more details on runtime flags and speculative decoding options.
 
+## RAG (Retrieval-Augmented Generation)
+
+Give your agents access to your documents with cagent's modular RAG system. It supports multiple retrieval strategies that can be used individually or combined for hybrid search.
+
+### Quick RAG Example
+
+```yaml
+models:
+  embedder:
+    provider: openai
+    model: text-embedding-3-small
+
+rag:
+  my_knowledge_base:
+    docs: [./documents, ./pdfs]
+    strategies:
+      - type: chunked-embeddings
+        model: embedder
+        threshold: 0.5
+        chunking:
+          size: 1000
+          overlap: 100
+    results:
+      limit: 5
+
+agents:
+  root:
+    model: openai/gpt-4o
+    instruction: |
+      You are an assistant with access to an internal knowledge base.
+      Use the knowledge base to gather context before answering user questions
+    rag: [my_knowledge_base]
+```
+
+### Hybrid Retrieval (Chunked-Embeddings + BM25)
+
+Combine semantic search (chunked-embeddings) with keyword search (BM25) for best results:
+
+```yaml
+rag:
+  hybrid_search:
+    docs: [./shared_docs]
+    
+    strategies:
+      - type: chunked-embeddings
+        model: embedder
+        threshold: 0.5
+        limit: 20
+        chunking:
+          size: 1000
+          overlap: 100
+      
+      - type: bm25
+        k1: 1.5
+        b: 0.75
+        threshold: 0.3
+        limit: 15
+        chunking:
+          size: 1000
+          overlap: 100
+    
+    results:
+      fusion:
+        strategy: rrf  # Reciprocal Rank Fusion
+        k: 60
+      deduplicate: true
+      limit: 5
+
+agents:
+  root:
+    model: openai/gpt-4o
+    rag: [hybrid_search]
+```
+
+**Features:**
+- **Multiple strategies**: Chunked-embeddings (semantic vector search), BM25 (keyword), or both
+- **Parallel execution**: Strategies run concurrently for fast results
+- **Pluggable fusion**: RRF, weighted, or max score combining
+- **Per-strategy configuration**: Different thresholds, limits, and documents
+- **Auto file watching**: Reindex automatically on file changes
+
+See the [RAG documentation](docs/RAG.md) for complete details, examples, and debugging guides.
+
 ## Quickly generate agents and agent teams with `cagent new`
 
 Using the command `cagent new` you can quickly generate agents or multi-agent
 
@@ -33,6 +33,13 @@
         "$ref": "#/definitions/ModelConfig"
       }
     },
+    "rag": {
+      "type": "object",
+      "description": "Map of RAG (Retrieval-Augmented Generation) configurations",
+      "additionalProperties": {
+        "$ref": "#/definitions/RAGConfig"
+      }
+    },
     "metadata": {
       "$ref": "#/definitions/Metadata",
       "description": "Configuration metadata"
@@ -188,6 +195,13 @@
             "schema"
           ],
           "additionalProperties": false
+        },
+        "rag": {
+          "type": "array",
+          "description": "List of RAG sources to use for this agent",
+          "items": {
+            "type": "string"
+          }
         }
       },
       "additionalProperties": false
@@ -625,6 +639,185 @@
         "method"
       ],
       "additionalProperties": false
+    },
+    "RAGConfig": {
+      "type": "object",
+      "description": "RAG (Retrieval-Augmented Generation) configuration for document search and retrieval with pluggable strategies. Multiple strategies enable hybrid retrieval and reranking.",
+      "properties": {
+        "description": {
+          "type": "string",
+          "description": "Description of the RAG source"
+        },
+        "docs": {
+          "type": "array",
+          "description": "Shared document paths or directories indexed by all strategies",
+          "items": {
+            "type": "string"
+          }
+        },
+        "strategies": {
+          "type": "array",
+          "description": "Array of retrieval strategy configurations. Each strategy can have different parameters based on its type.",
+          "minItems": 1,
+          "items": {
+            "type": "object",
+            "description": "Retrieval strategy configuration with type-specific parameters. Structured fields are limited; additional parameters are passed through as-is for strategy-specific use.",
+            "required": ["type"],
+            "properties": {
+              "type": {
+                "type": "string",
+                "description": "Retrieval strategy type",
+                "enum": ["chunked-embeddings", "bm25"]
+              },
+              "model": {
+                "type": "string",
+                "description": "Embedding model reference for chunked-embeddings strategies (looked up in models map, or 'auto' for automatic selection)",
+                "examples": ["openai/text-embedding-3-small", "dmr/embeddinggemma", "auto"]
+              },
+              "docs": {
+                "type": "array",
+                "description": "Additional documents for this strategy only (augments shared docs)",
+                "items": {
+                  "type": "string"
+                }
+              },
+              "database": {
+                "type": "string",
+                "description": "Database path or connection string. Currently only simple string values are supported (e.g., './vector.db', './bm25.db')."
+              },
+              "similarity_metric": {
+                "type": "string",
+                "description": "Similarity metric (chunked-embeddings only). Currently only 'cosine_similarity' is implemented.",
+                "enum": ["cosine_similarity"]
+              },
+              "vector_dimensions": {
+                "type": "integer",
+                "description": "Vector dimensions for embeddings (chunked-embeddings only). Must match your embedding model's output dimensions and is required for chunked-embeddings strategies.",
+                "minimum": 1,
+                "examples": [1536, 3072, 1024, 768]
+              },
+              "k1": {
+                "type": "number",
+                "description": "BM25 term frequency saturation (bm25 only, typically 1.2-2.0)",
+                "minimum": 0
+              },
+              "b": {
+                "type": "number",
+                "description": "BM25 length normalization (bm25 only, 0-1, typically 0.75)",
+                "minimum": 0,
+                "maximum": 1
+              },
+              "threshold": {
+                "type": "number",
+                "description": "Minimum score threshold (0-1 for chunked-embeddings, unbounded for bm25)",
+                "minimum": 0
+              },
+              "limit": {
+                "type": "integer",
+                "description": "Max results from this strategy (candidates for fusion). If unset, defaults to 5 in the implementation.",
+                "minimum": 1
+              },
+              "chunking": {
+                "type": "object",
+                "description": "Text chunking configuration",
+                "properties": {
+                  "size": {
+                    "type": "integer",
+                    "description": "Chunk size in characters. If unset, defaults to 1000 in the implementation.",
+                    "minimum": 1
+                  },
+                  "overlap": {
+                    "type": "integer",
+                    "description": "Overlap between chunks in characters. If unset, defaults to 75 in the implementation.",
+                    "minimum": 0
+                  },
+                  "respect_word_boundaries": {
+                    "type": "boolean",
+                    "description": "When true, chunks will split on the nearest whitespace boundary instead of at the exact character limit, preventing words from being truncated."
+                  }
+                },
+                "additionalProperties": false
+              }
+            },
+            "additionalProperties": true
+          }
+        },
+        "results": {
+          "type": "object",
+          "description": "Result post-processing configuration (fusion, deduplication, limiting). If omitted, sensible defaults are applied in code.",
+          "properties": {
+            "limit": {
+              "type": "integer",
+              "description": "Maximum number of results to return (top K)",
+              "minimum": 1,
+              "default": 15
+            },
+            "fusion": {
+              "type": "object",
+              "description": "Configuration for combining results from multiple strategies. If omitted and multiple strategies are configured, Reciprocal Rank Fusion (rrf) with k=60 is used.",
+              "properties": {
+                "strategy": {
+                  "type": "string",
+                  "description": "Fusion strategy to use",
+                  "enum": [
+                    "rrf",
+                    "reciprocal_rank_fusion",
+                    "weighted",
+                    "max"
+                  ],
+                  "default": "rrf",
+                  "examples": [
+                    "rrf",
+                    "weighted"
+                  ]
+                },
+                "k": {
+                  "type": "integer",
+                  "description": "RRF smoothing parameter k (only for RRF strategy)",
+                  "minimum": 1,
+                  "default": 60
+                },
+                "weights": {
+                  "type": "object",
+                  "description": "Strategy weights for weighted fusion (strategy name -> weight)",
+                  "additionalProperties": {
+                    "type": "number",
+                    "minimum": 0,
+                    "maximum": 1
+                  },
+                  "examples": [
+                    {
+                      "chunked-embeddings": 0.7,
+                      "bm25": 0.3
+                    }
+                  ]
+                }
+              },
+              "additionalProperties": false
+            },
+            "deduplicate": {
+              "type": "boolean",
+              "description": "Remove duplicate documents across strategies",
+              "default": true
+            },
+            "include_score": {
+              "type": "boolean",
+              "description": "Include relevance scores in results",
+              "default": false
+            },
+            "return_full_content": {
+              "type": "boolean",
+              "description": "Return full document content instead of just the matched chunk. The full document is read directly from the file system.",
+              "default": false
+            }
+          },
+          "additionalProperties": false
+        }
+      },
+      "required": [
+        "strategies"
+      ],
+      "additionalProperties": false
     }
   }
 }
@@ -68,7 +68,7 @@ func (f *newFlags) runNewCommand(cmd *cobra.Command, args []string) error {
 
 	sess := session.New(opts...)
 
-	a := app.New("", rt, sess, prompt)
+	a := app.New(ctx, "", rt, sess, prompt)
 	m := tui.New(a)
 
 	progOpts := []tea.ProgramOption{
 
@@ -240,7 +240,7 @@ func handleRunMode(ctx context.Context, agentFilename string, rt runtime.Runtime
 		return err
 	}
 
-	a := app.New(agentFilename, rt, sess, firstMessage)
+	a := app.New(ctx, agentFilename, rt, sess, firstMessage)
 	m := tui.New(a)
 
 	progOpts := []tea.ProgramOption{
Original file line number	Diff line number	Diff line change
`@@ -240,7 +240,7 @@ func handleRunMode(ctx context.Context, agentFilename string, rt runtime.Runtime`
`240`	`240`	`return err`
`241`	`241`	`}`
`242`	`242`
`243`		`- a := app.New(agentFilename, rt, sess, firstMessage)`
	`243`	`+ a := app.New(ctx, agentFilename, rt, sess, firstMessage)`
`244`	`244`	`m := tui.New(a)`
`245`	`245`
`246`	`246`	`progOpts := []tea.ProgramOption{`