diff --git a/.changeset/document-utils-integration.md b/.changeset/document-utils-integration.md new file mode 100644 index 000000000..ab77e902f --- /dev/null +++ b/.changeset/document-utils-integration.md @@ -0,0 +1,6 @@ +--- +"@voltagent/documents": minor +"@voltagent/core": minor +--- + +feat: implement document chunking and embedding utilities and integrate into core diff --git a/biome.json b/biome.json index e44564076..9b116689a 100644 --- a/biome.json +++ b/biome.json @@ -61,7 +61,9 @@ ".wrangler", "packages/server-hono/src/vendor", "examples/with-nuxt", - "examples/with-assistant-ui" + "examples/with-assistant-ui", + "archive", + "website" ] }, "overrides": [ diff --git a/packages/core/package.json b/packages/core/package.json index d2c16a5e7..69d760918 100644 --- a/packages/core/package.json +++ b/packages/core/package.json @@ -16,6 +16,7 @@ "@opentelemetry/sdk-trace-base": "^2.0.0", "@opentelemetry/sdk-trace-node": "^2.0.0", "@opentelemetry/semantic-conventions": "^1.28.0", + "@voltagent/documents": "workspace:*", "@voltagent/internal": "^1.0.2", "fast-glob": "^3.3.3", "gray-matter": "^4.0.3", @@ -82,4 +83,4 @@ "typecheck": "tsc --noEmit" }, "types": "dist/index.d.ts" -} +} \ No newline at end of file diff --git a/packages/core/src/agent/subagent/index.ts b/packages/core/src/agent/subagent/index.ts index 343e19cad..4e4bc69c1 100644 --- a/packages/core/src/agent/subagent/index.ts +++ b/packages/core/src/agent/subagent/index.ts @@ -316,6 +316,7 @@ ${guidelinesText} /** * Hand off a task to another agent using AgentV2 */ + // biome-ignore lint/complexity/noExcessiveCognitiveComplexity: legacy complexity allowed public async handoffTask(options: { task: string; targetAgent: SubAgentConfig; diff --git a/packages/core/src/retriever/document-retriever.ts b/packages/core/src/retriever/document-retriever.ts new file mode 100644 index 000000000..31cbe7b37 --- /dev/null +++ b/packages/core/src/retriever/document-retriever.ts @@ -0,0 +1,73 @@ +import { 
DocumentProcessor, type ProcessedDocument } from "@voltagent/documents"; +import type { BaseMessage } from "../agent/providers"; +import { BaseRetriever } from "./retriever"; +import type { RetrieveOptions, RetrieverOptions } from "./types"; + +export interface DocumentRetrieverOptions extends RetrieverOptions { + /** + * Optional custom document processor. + * If not provided, a default one will be created. + */ + processor?: DocumentProcessor; +} + +/** + * Abstract base class for retrievers that handle document ingestion and vector search. + */ +export abstract class DocumentRetriever extends BaseRetriever { + protected processor: DocumentProcessor; + + constructor(options: DocumentRetrieverOptions = {}) { + super(options); + this.processor = options.processor || new DocumentProcessor(); + } + + /** + * Ingests text, chunks it, embeds it, and stores it using upsertDocuments. + * @param text The raw text to ingest + * @param metadata Optional metadata to attach to all chunks + */ + async ingest(text: string, metadata?: Record): Promise { + this.logger.debug("Ingesting document text", { length: text.length }); + const documents = await this.processor.process(text, metadata); + await this.upsertDocuments(documents); + this.logger.debug("Document ingestion complete", { chunks: documents.length }); + } + + /** + * Abstract method to store processed documents in the underlying storage (e.g., Vector DB). + * @param documents The processed documents containing embeddings and metadata + */ + abstract upsertDocuments(documents: ProcessedDocument[]): Promise; + + /** + * Abstract method to retrieve documents based on a query vector. + * This is a helper for the main retrieve method. + * @param vector The query vector + * @param k Number of results to return + */ + abstract queryVectors(vector: number[], k: number): Promise; + + /** + * Default implementation of retrieve that embeds the query and searches vectors. + * Can be overridden if needed. 
+ */ + async retrieve(input: string | BaseMessage[], options: RetrieveOptions = {}): Promise { + if (Array.isArray(input) && input.length === 0) { + return ""; + } + const textQuery = typeof input === "string" ? input : input[input.length - 1].content; + + // We assume the processor's embedder has an embedQuery method. + // Since DocumentProcessor exposes 'embedder', we can use it. + const queryVector = await this.processor.embedder.embedQuery(textQuery as string); + + // Default top-k to 4, can be customizable via options + const k = (options as any).k ?? 4; + + const results = await this.queryVectors(queryVector, k); + + // Join the text of the results + return results.map((doc) => doc.text).join("\n\n"); + } +} diff --git a/packages/core/src/retriever/index.ts b/packages/core/src/retriever/index.ts index 422692dd8..1e5f41aa9 100644 --- a/packages/core/src/retriever/index.ts +++ b/packages/core/src/retriever/index.ts @@ -3,7 +3,10 @@ * @module retriever */ +export type { ProcessedDocument } from "@voltagent/documents"; + export { BaseRetriever } from "./retriever"; +export { DocumentRetriever, type DocumentRetrieverOptions } from "./document-retriever"; export type { Retriever, RetrieverOptions, RetrieveOptions } from "./types"; export { VoltAgentRagRetriever, diff --git a/packages/documents/README.md b/packages/documents/README.md new file mode 100644 index 000000000..e2c7e8e8f --- /dev/null +++ b/packages/documents/README.md @@ -0,0 +1,71 @@ +# @voltagent/documents + +Utilities for document processing, chunking, and embedding generation. + +## Installation + +```bash +pnpm add @voltagent/documents +``` + +## Usage + +### Text Splitting + +Use `RecursiveCharacterTextSplitter` to split text into chunks while preserving context. 
+
+```typescript
+import { RecursiveCharacterTextSplitter } from "@voltagent/documents";
+
+const splitter = new RecursiveCharacterTextSplitter({
+  chunkSize: 1000,
+  chunkOverlap: 200,
+});
+
+const text = "Your long text here...";
+const chunks = await splitter.splitText(text);
+```
+
+### Embeddings
+
+Use `OpenAIEmbeddingModel` to generate embeddings for your text.
+
+```typescript
+import { OpenAIEmbeddingModel } from "@voltagent/documents";
+
+const embedder = new OpenAIEmbeddingModel({
+  apiKey: process.env.OPENAI_API_KEY, // Optional if set in env
+  model: "text-embedding-ada-002", // Default
+});
+
+const embedding = await embedder.embedQuery("Hello world");
+```
+
+### Document Processor
+
+The `DocumentProcessor` combines splitting and embedding.
+
+```typescript
+import { DocumentProcessor } from "@voltagent/documents";
+
+const processor = new DocumentProcessor();
+// Or with a custom splitter/embedder:
+// const processor = new DocumentProcessor(customSplitter, customEmbedder);
+
+const documents = await processor.process("Long text content...", {
+  source: "example.txt",
+  author: "Me",
+});
+
+/*
+Returns:
+[
+  {
+    text: "chunk 1...",
+    embedding: [0.123, ...],
+    metadata: { source: "example.txt", author: "Me", chunkIndex: 0, ... }
+  },
+  ...
+] +*/ +``` diff --git a/packages/documents/package.json b/packages/documents/package.json new file mode 100644 index 000000000..48cde0223 --- /dev/null +++ b/packages/documents/package.json @@ -0,0 +1,38 @@ +{ + "name": "@voltagent/documents", + "version": "0.0.1", + "description": "Document processing and embedding utilities for VoltAgent", + "main": "dist/index.js", + "module": "dist/index.mjs", + "types": "dist/index.d.ts", + "exports": { + ".": { + "import": { + "types": "./dist/index.d.mts", + "default": "./dist/index.mjs" + }, + "require": { + "types": "./dist/index.d.ts", + "default": "./dist/index.js" + } + } + }, + "files": [ + "dist" + ], + "scripts": { + "build": "tsup", + "dev": "tsup --watch", + "typecheck": "tsc --noEmit", + "test": "vitest run" + }, + "dependencies": { + "openai": "^4.20.0" + }, + "devDependencies": { + "tsup": "^8.5.0", + "typescript": "^5.8.2", + "vitest": "^3.2.4", + "@types/node": "^24.2.1" + } +} \ No newline at end of file diff --git a/packages/documents/src/DocumentProcessor.test.ts b/packages/documents/src/DocumentProcessor.test.ts new file mode 100644 index 000000000..d1364e9ee --- /dev/null +++ b/packages/documents/src/DocumentProcessor.test.ts @@ -0,0 +1,44 @@ +import { describe, expect, it } from "vitest"; +import { DocumentProcessor } from "./DocumentProcessor"; +import type { EmbeddingModel } from "./embeddings/EmbeddingModel"; +import { TextSplitter } from "./text-splitters/TextSplitter"; + +class MockSplitter extends TextSplitter { + async splitText(text: string): Promise { + return text.split("|"); + } +} + +class MockEmbedder implements EmbeddingModel { + async embedQuery(_text: string): Promise { + return [0.1, 0.2]; + } + async embedDocuments(documents: string[]): Promise { + return documents.map(() => [0.1, 0.2]); + } +} + +describe("DocumentProcessor", () => { + it("processes text into documents with embeddings", async () => { + const processor = new DocumentProcessor(new MockSplitter(), new MockEmbedder()); + 
const result = await processor.process("part1|part2", { file: "test.txt" }); + + expect(result).toHaveLength(2); + + expect(result[0].text).toBe("part1"); + expect(result[0].embedding).toEqual([0.1, 0.2]); + expect(result[0].metadata).toEqual({ + file: "test.txt", + chunkIndex: 0, + chunkCount: 2, + }); + + expect(result[1].text).toBe("part2"); + expect(result[1].embedding).toEqual([0.1, 0.2]); + expect(result[1].metadata).toEqual({ + file: "test.txt", + chunkIndex: 1, + chunkCount: 2, + }); + }); +}); diff --git a/packages/documents/src/DocumentProcessor.ts b/packages/documents/src/DocumentProcessor.ts new file mode 100644 index 000000000..361d37426 --- /dev/null +++ b/packages/documents/src/DocumentProcessor.ts @@ -0,0 +1,35 @@ +import type { EmbeddingModel } from "./embeddings/EmbeddingModel"; +import { OpenAIEmbeddingModel } from "./embeddings/OpenAIEmbeddingModel"; +import { RecursiveCharacterTextSplitter } from "./text-splitters/RecursiveCharacterTextSplitter"; +import type { TextSplitter } from "./text-splitters/TextSplitter"; + +export interface ProcessedDocument { + text: string; + embedding: number[]; + metadata?: Record; +} + +export class DocumentProcessor { + splitter: TextSplitter; + embedder: EmbeddingModel; + + constructor(splitter?: TextSplitter, embedder?: EmbeddingModel) { + this.splitter = splitter ?? new RecursiveCharacterTextSplitter(); + this.embedder = embedder ?? 
new OpenAIEmbeddingModel(); + } + + async process(text: string, metadata?: Record): Promise { + const chunks = await this.splitter.splitText(text); + const embeddings = await this.embedder.embedDocuments(chunks); + + return chunks.map((chunk, index) => ({ + text: chunk, + embedding: embeddings[index], + metadata: { + ...metadata, + chunkIndex: index, + chunkCount: chunks.length, + }, + })); + } +} diff --git a/packages/documents/src/RecursiveCharacterTextSplitter.test.ts b/packages/documents/src/RecursiveCharacterTextSplitter.test.ts new file mode 100644 index 000000000..2110b710c --- /dev/null +++ b/packages/documents/src/RecursiveCharacterTextSplitter.test.ts @@ -0,0 +1,76 @@ +import { describe, expect, it } from "vitest"; +import { RecursiveCharacterTextSplitter } from "./text-splitters/RecursiveCharacterTextSplitter"; + +describe("RecursiveCharacterTextSplitter", () => { + it("splits text based on characters", async () => { + const splitter = new RecursiveCharacterTextSplitter({ + chunkSize: 10, + chunkOverlap: 0, + }); + const text = "abcdefghijklmnopqrstuvwxyz"; + const chunks = await splitter.splitText(text); + // Expect chunks to be size 10 -> "abcdefghij", "klmnopqrst", "uvwxyz" + expect(chunks).toEqual(["abcdefghij", "klmnopqrst", "uvwxyz"]); + }); + + it("splits text with simple separator", async () => { + const splitter = new RecursiveCharacterTextSplitter({ + chunkSize: 10, + chunkOverlap: 0, + separators: [" "], + }); + const text = "hello world how are you"; + // "hello world" is 11 chars > 10. + // "hello" (5) + // "world" (5) + // "how" (3) + // "are" (3) + // "you" (3) + // "how are you" -> 3+1+3+1+3 = 11 > 10. + // So "how are" (7) + // "you" (3) + const chunks = await splitter.splitText(text); + // My implementation logic: + // split by " ". -> ["hello", "world", "how", "are", "you"] + // "hello" -> current. + // "world" -> len 5. "hello" + 1 + "world" = 11 > 10. Flush "hello". current="world". + // "how" -> len 3. "world" + 1 + "how" = 9 <= 10. 
current="world how". + // "are" -> len 3. "world how" + 1 + "are" = 9+1+3=13 > 10. Flush "world how". current="are". + // "you" -> len 3. "are" + 1 + "you" = 7 <= 10. current="are you". + // Flush "are you". + + expect(chunks).toEqual(["hello", "world how", "are you"]); + }); + + it("handles recursion with multiple separators", async () => { + // This tests the recursion logic + const splitter = new RecursiveCharacterTextSplitter({ + chunkSize: 20, + chunkOverlap: 0, + separators: ["\n", " "], + }); + // "Para1 word word word" -> 20 chars + const text = "Para1 is longer than 20 chars\nPara2 is short"; + const chunks = await splitter.splitText(text); + + // Split by \n: + // "Para1 is longer than 20 chars" (29 chars) -> Too big -> Recurse with [" "] + // "Para2 is short" (14 chars) -> Fits. + + // Recursion on "Para1...": + // Split by " ": "Para1", "is", "longer", "than", "20", "chars" + // Accumulate: + // "Para1 is" (8) + // + "longer" (6) -> "Para1 is longer" (15) + // + "than" (4) -> "Para1 is longer than" (20) -> Perfect fit? (15+1+4=20). Yes. + // + "20" (2) -> "Para1 is longer than 20" (23) -> Flush "Para1 is longer than". Current="20". + // "chars" -> "20 chars" (8). 
+ + // So result should be: + // "Para1 is longer than" + // "20 chars" + // "Para2 is short" + + expect(chunks).toEqual(["Para1 is longer than", "20 chars", "Para2 is short"]); + }); +}); diff --git a/packages/documents/src/embeddings/EmbeddingModel.ts b/packages/documents/src/embeddings/EmbeddingModel.ts new file mode 100644 index 000000000..80f10cfb8 --- /dev/null +++ b/packages/documents/src/embeddings/EmbeddingModel.ts @@ -0,0 +1,4 @@ +export interface EmbeddingModel { + embedQuery(text: string): Promise; + embedDocuments(documents: string[]): Promise; +} diff --git a/packages/documents/src/embeddings/OpenAIEmbeddingModel.ts b/packages/documents/src/embeddings/OpenAIEmbeddingModel.ts new file mode 100644 index 000000000..b3d30b16f --- /dev/null +++ b/packages/documents/src/embeddings/OpenAIEmbeddingModel.ts @@ -0,0 +1,49 @@ +import { OpenAI } from "openai"; +import type { EmbeddingModel } from "./EmbeddingModel"; + +export interface OpenAIEmbeddingModelParams { + apiKey?: string; + model?: string; + maxBatchSize?: number; +} + +export class OpenAIEmbeddingModel implements EmbeddingModel { + private client: OpenAI; + private model: string; + private maxBatchSize: number; + + constructor(params?: OpenAIEmbeddingModelParams) { + this.client = new OpenAI({ + apiKey: params?.apiKey ?? process.env.OPENAI_API_KEY, + }); + this.model = params?.model ?? "text-embedding-ada-002"; + this.maxBatchSize = params?.maxBatchSize ?? 
512; + } + + async embedQuery(text: string): Promise { + const response = await this.client.embeddings.create({ + model: this.model, + input: text.replace(/\n/g, " "), + }); + return response.data[0].embedding; + } + + async embedDocuments(documents: string[]): Promise { + const embeddings: number[][] = []; + + for (let i = 0; i < documents.length; i += this.maxBatchSize) { + const batch = documents.slice(i, i + this.maxBatchSize).map((d) => d.replace(/\n/g, " ")); + if (batch.length === 0) continue; + + const response = await this.client.embeddings.create({ + model: this.model, + input: batch, + }); + + const sortedData = response.data.sort((a, b) => a.index - b.index); + embeddings.push(...sortedData.map((item) => item.embedding)); + } + + return embeddings; + } +} diff --git a/packages/documents/src/index.ts b/packages/documents/src/index.ts new file mode 100644 index 000000000..be2278204 --- /dev/null +++ b/packages/documents/src/index.ts @@ -0,0 +1,5 @@ +export * from "./text-splitters/TextSplitter"; +export * from "./text-splitters/RecursiveCharacterTextSplitter"; +export * from "./embeddings/EmbeddingModel"; +export * from "./embeddings/OpenAIEmbeddingModel"; +export * from "./DocumentProcessor"; diff --git a/packages/documents/src/text-splitters/RecursiveCharacterTextSplitter.ts b/packages/documents/src/text-splitters/RecursiveCharacterTextSplitter.ts new file mode 100644 index 000000000..e1d675310 --- /dev/null +++ b/packages/documents/src/text-splitters/RecursiveCharacterTextSplitter.ts @@ -0,0 +1,91 @@ +import { TextSplitter, type TextSplitterParams } from "./TextSplitter"; + +export interface RecursiveCharacterTextSplitterParams extends TextSplitterParams { + separators?: string[]; +} + +export class RecursiveCharacterTextSplitter extends TextSplitter { + separators: string[]; + + constructor(fields?: RecursiveCharacterTextSplitterParams) { + super(fields); + this.separators = fields?.separators ?? 
["\n\n", "\n", " ", ""]; + } + + async splitText(text: string): Promise { + return this._splitText(text, this.separators); + } + + // biome-ignore lint/complexity/noExcessiveCognitiveComplexity: recursive splitting logic is complex + private _splitText(text: string, separators: string[]): string[] { + const finalChunks: string[] = []; + + let separator = separators[separators.length - 1]; + let newSeparators: string[] = []; // Separators to use for recursion + + for (let i = 0; i < separators.length; i++) { + const s = separators[i]; + if (s === "") { + separator = s; + break; + } + if (text.includes(s)) { + separator = s; + newSeparators = separators.slice(i + 1); + break; + } + } + + const splits = separator ? text.split(separator) : text.split(""); + let currentDoc: string[] = []; + let total = 0; + + for (const split of splits) { + const len = split.length; + if (len > this.chunkSize && newSeparators.length > 0) { + // If a single split is too large, verify if we need to flush what we have so far + if (currentDoc.length > 0) { + finalChunks.push(currentDoc.join(separator)); + // Reset currentDoc, naive overlap handling for mixed recursion cases: just clear + currentDoc = []; + total = 0; + } + + // Recurse on the large split + const recursionDocs = this._splitText(split, newSeparators); + finalChunks.push(...recursionDocs); + } else { + // Check if adding this split would exceed chunk size + if (total + len + (currentDoc.length > 0 ? separator.length : 0) > this.chunkSize) { + if (currentDoc.length > 0) { + finalChunks.push(currentDoc.join(separator)); + + // Prune from start to maintain overlap + // We remove items until the remaining total is <= chunkOverlap + // Note: This logic is approximate. + while ( + total > this.chunkOverlap || + (total + len + (currentDoc.length > 0 ? separator.length : 0) > this.chunkSize && + currentDoc.length > 0) + ) { + const first = currentDoc.shift(); + if (first) { + total -= first.length + (currentDoc.length > 0 ? 
separator.length : 0); + } else { + break; + } + } + } + } + currentDoc.push(split); + total += len + (currentDoc.length > 1 ? separator.length : 0); + } + } + + if (currentDoc.length > 0) { + finalChunks.push(currentDoc.join(separator)); + } + + return finalChunks; + } +} diff --git a/packages/documents/src/text-splitters/TextSplitter.ts b/packages/documents/src/text-splitters/TextSplitter.ts new file mode 100644 index 000000000..7f7d9aef7 --- /dev/null +++ b/packages/documents/src/text-splitters/TextSplitter.ts @@ -0,0 +1,37 @@ +export interface TextSplitterParams { + chunkSize?: number; + chunkOverlap?: number; +} + +export abstract class TextSplitter { + chunkSize: number; + chunkOverlap: number; + + constructor(fields?: TextSplitterParams) { + this.chunkSize = fields?.chunkSize ?? 1000; + this.chunkOverlap = fields?.chunkOverlap ?? 200; + + if (this.chunkSize <= 0) { + throw new Error(`chunkSize must be a positive number, but got ${this.chunkSize}`); + } + + if (this.chunkOverlap < 0) { + throw new Error(`chunkOverlap must be non-negative, but got ${this.chunkOverlap}`); + } + + if (this.chunkOverlap >= this.chunkSize) { + throw new Error("Chunk overlap must be less than chunk size"); + } + } + + abstract splitText(text: string): Promise; + + async createDocuments(texts: string[]): Promise { + const documents: string[] = []; + for (const text of texts) { + const chunks = await this.splitText(text); + documents.push(...chunks); + } + return documents; + } +} diff --git a/packages/documents/tsconfig.json b/packages/documents/tsconfig.json new file mode 100644 index 000000000..c333ab017 --- /dev/null +++ b/packages/documents/tsconfig.json @@ -0,0 +1,30 @@ +{ + "compilerOptions": { + "target": "ES2022", + "lib": ["dom", "dom.iterable", "esnext"], + "module": "esnext", + "moduleResolution": "bundler", + "declaration": true, + "declarationMap": true, + "sourceMap": true, + "outDir": "./dist", + "rootDir": "./", + "strict": true, + "noImplicitAny": true, + 
"strictNullChecks": true, + "strictFunctionTypes": true, + "strictBindCallApply": true, + "strictPropertyInitialization": true, + "noImplicitThis": true, + "noUnusedLocals": true, + "noUnusedParameters": true, + "noImplicitReturns": true, + "noFallthroughCasesInSwitch": true, + "esModuleInterop": true, + "skipLibCheck": true, + "forceConsistentCasingInFileNames": true, + "types": ["vitest/globals", "node"] + }, + "include": ["src/**/*.ts"], + "exclude": ["node_modules", "dist"] +} diff --git a/packages/documents/tsup.config.ts b/packages/documents/tsup.config.ts new file mode 100644 index 000000000..0819104fd --- /dev/null +++ b/packages/documents/tsup.config.ts @@ -0,0 +1,19 @@ +import { defineConfig } from "tsup"; +import { markAsExternalPlugin } from "../shared/tsup-plugins/mark-as-external"; + +export default defineConfig({ + entry: ["src/index.ts"], + format: ["cjs", "esm"], + splitting: false, + sourcemap: true, + clean: false, + target: "es2022", + outDir: "dist", + minify: false, + dts: true, + esbuildPlugins: [markAsExternalPlugin], + esbuildOptions(options) { + options.keepNames = true; + return options; + }, +}); diff --git a/packages/server-core/src/websocket/setup.ts b/packages/server-core/src/websocket/setup.ts index cfca7e329..1968a288d 100644 --- a/packages/server-core/src/websocket/setup.ts +++ b/packages/server-core/src/websocket/setup.ts @@ -229,6 +229,7 @@ export function setupWebSocketUpgrade( auth?: AuthProvider | AuthNextConfig, logger?: Logger, ): void { + // biome-ignore lint/complexity/noExcessiveCognitiveComplexity: legacy complexity allowed server.addListener("upgrade", async (req: IncomingMessage, socket: Socket, head: Buffer) => { const url = new URL(req.url || "", "http://localhost"); const path = url.pathname; diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml index 4562a5bf1..a8dab3542 100644 --- a/pnpm-lock.yaml +++ b/pnpm-lock.yaml @@ -3745,6 +3745,9 @@ importers: '@opentelemetry/semantic-conventions': specifier: ^1.28.0 version: 1.36.0 
+ '@voltagent/documents': + specifier: workspace:* + version: link:../documents '@voltagent/internal': specifier: ^1.0.2 version: link:../internal @@ -3880,6 +3883,25 @@ importers: specifier: ^4.1.11 version: 4.1.11 + packages/documents: + dependencies: + openai: + specifier: ^4.20.0 + version: 4.104.0(ws@8.18.3)(zod@3.25.76) + devDependencies: + '@types/node': + specifier: ^24.2.1 + version: 24.6.2 + tsup: + specifier: ^8.5.0 + version: 8.5.0(@swc/core@1.5.29)(typescript@5.9.3) + typescript: + specifier: ^5.8.2 + version: 5.9.3 + vitest: + specifier: ^3.2.4 + version: 3.2.4(@types/node@24.6.2)(@vitest/ui@1.6.1)(jsdom@22.1.0) + packages/evals: dependencies: '@voltagent/internal': @@ -10728,6 +10750,7 @@ packages: dependencies: '@cfworker/json-schema': 4.1.1 ansi-styles: 5.2.0 + apache-arrow: 18.1.0 camelcase: 6.3.0 decamelize: 1.2.0 js-tiktoken: 1.0.21 @@ -10735,9 +10758,18 @@ packages: mustache: 4.2.0 p-queue: 6.6.2 p-retry: 4.6.2 + reflect-metadata: 0.2.2 uuid: 10.0.0 zod: 3.25.76 zod-to-json-schema: 3.25.0(zod@3.25.76) + optionalDependencies: + '@lancedb/lancedb-darwin-arm64': 0.23.0 + '@lancedb/lancedb-linux-arm64-gnu': 0.23.0 + '@lancedb/lancedb-linux-arm64-musl': 0.23.0 + '@lancedb/lancedb-linux-x64-gnu': 0.23.0 + '@lancedb/lancedb-linux-x64-musl': 0.23.0 + '@lancedb/lancedb-win32-arm64-msvc': 0.23.0 + '@lancedb/lancedb-win32-x64-msvc': 0.23.0 transitivePeerDependencies: - '@opentelemetry/api' - '@opentelemetry/exporter-trace-otlp-proto' @@ -16592,13 +16624,8 @@ packages: resolution: {integrity: sha512-vENRlFU4YbrwVqNDZ7fLvy+JR1CRkyr01jhSiDpE1u6py3OMzQfztQU2jxykW3ALNxO4kSlqIDeYyD0Y9RcQeQ==} dev: true - /@rolldown/pluginutils@1.0.0-beta.58: - resolution: {integrity: sha512-qWhDs6yFGR5xDfdrwiSa3CWGIHxD597uGE/A9xGqytBjANvh4rLCTTkq7szhMV4+Ygh+PMS90KVJ8xWG/TkX4w==} - dev: false - /@rolldown/pluginutils@1.0.0-beta.59: resolution: {integrity: sha512-aoh6LAJRyhtazs98ydgpNOYstxUlsOV1KJXcpf/0c0vFcUA8uyd/hwKRhqE/AAPNqAho9RliGsvitCoOzREoVA==} - dev: true 
/@rollup/plugin-alias@5.1.1(rollup@4.50.2): resolution: {integrity: sha512-PR9zDb+rOzkRb2VD+EuKB7UC41vU5DIwZ5qqCpk0KJudcWAyi8rvYOhS7+L5aZCspw1stTViLgN5v6FF1p5cgQ==} @@ -19981,7 +20008,7 @@ packages: '@babel/core': 7.28.5 '@babel/plugin-syntax-typescript': 7.27.1(@babel/core@7.28.5) '@babel/plugin-transform-typescript': 7.28.0(@babel/core@7.28.5) - '@rolldown/pluginutils': 1.0.0-beta.58 + '@rolldown/pluginutils': 1.0.0-beta.59 '@vue/babel-plugin-jsx': 1.5.0(@babel/core@7.28.5) vite: 7.2.7(@types/node@24.2.1)(jiti@2.6.1) vue: 3.5.22(typescript@5.9.3) @@ -37892,6 +37919,51 @@ packages: - yaml dev: true + /tsup@8.5.0(@swc/core@1.5.29)(typescript@5.9.3): + resolution: {integrity: sha512-VmBp77lWNQq6PfuMqCHD3xWl22vEoWsKajkF8t+yMBawlUS8JzEI+vOVMeuNZIuMML8qXRizFKi9oD5glKQVcQ==} + engines: {node: '>=18'} + hasBin: true + peerDependencies: + '@microsoft/api-extractor': ^7.36.0 + '@swc/core': ^1 + postcss: ^8.4.12 + typescript: '>=4.5.0' + peerDependenciesMeta: + '@microsoft/api-extractor': + optional: true + '@swc/core': + optional: true + postcss: + optional: true + typescript: + optional: true + dependencies: + '@swc/core': 1.5.29(@swc/helpers@0.5.17) + bundle-require: 5.1.0(esbuild@0.25.10) + cac: 6.7.14 + chokidar: 4.0.3 + consola: 3.4.2 + debug: 4.4.3(supports-color@10.2.2) + esbuild: 0.25.10 + fix-dts-default-cjs-exports: 1.0.1 + joycon: 3.1.1 + picocolors: 1.1.1 + postcss-load-config: 6.0.1 + resolve-from: 5.0.0 + rollup: 4.50.2 + source-map: 0.8.0-beta.0 + sucrase: 3.35.0 + tinyexec: 0.3.2 + tinyglobby: 0.2.15 + tree-kill: 1.2.2 + typescript: 5.9.3 + transitivePeerDependencies: + - jiti + - supports-color + - tsx + - yaml + dev: true + /tsx@4.20.4: resolution: {integrity: sha512-yyxBKfORQ7LuRt/BQKBXrpcq59ZvSW0XxwfjAt3w2/8PmdxaFzijtMhTawprSHhpzeM5BgU2hXHG3lklIERZXg==} engines: {node: '>=18.0.0'} @@ -39212,6 +39284,31 @@ packages: - yaml dev: false + /vite-node@3.2.4(@types/node@24.6.2): + resolution: {integrity: 
sha512-EbKSKh+bh1E1IFxeO0pg1n4dvoOTt0UDiXMd/qn++r98+jPO1xtJilvXldeuQ8giIB5IkpjCgMleHMNEsGH6pg==} + engines: {node: ^18.0.0 || ^20.0.0 || >=22.0.0} + hasBin: true + dependencies: + cac: 6.7.14 + debug: 4.4.3(supports-color@10.2.2) + es-module-lexer: 1.7.0 + pathe: 2.0.3 + vite: 7.2.7(@types/node@24.6.2) + transitivePeerDependencies: + - '@types/node' + - jiti + - less + - lightningcss + - sass + - sass-embedded + - stylus + - sugarss + - supports-color + - terser + - tsx + - yaml + dev: true + /vite-plugin-checker@0.11.0(@biomejs/biome@1.9.4)(eslint@9.33.0)(typescript@5.9.3)(vite@7.2.7): resolution: {integrity: sha512-iUdO9Pl9UIBRPAragwi3as/BXXTtRu4G12L3CMrjx+WVTd9g/MsqNakreib9M/2YRVkhZYiTEwdH2j4Dm0w7lw==} engines: {node: '>=16.11'} @@ -39407,6 +39504,57 @@ packages: fsevents: 2.3.3 dev: false + /vite@7.2.7(@types/node@24.6.2): + resolution: {integrity: sha512-ITcnkFeR3+fI8P1wMgItjGrR10170d8auB4EpMLPqmx6uxElH3a/hHGQabSHKdqd4FXWO1nFIp9rRn7JQ34ACQ==} + engines: {node: ^20.19.0 || >=22.12.0} + hasBin: true + peerDependencies: + '@types/node': ^20.19.0 || >=22.12.0 + jiti: '>=1.21.0' + less: ^4.0.0 + lightningcss: ^1.21.0 + sass: ^1.70.0 + sass-embedded: ^1.70.0 + stylus: '>=0.54.8' + sugarss: ^5.0.0 + terser: ^5.16.0 + tsx: ^4.8.1 + yaml: ^2.4.2 + peerDependenciesMeta: + '@types/node': + optional: true + jiti: + optional: true + less: + optional: true + lightningcss: + optional: true + sass: + optional: true + sass-embedded: + optional: true + stylus: + optional: true + sugarss: + optional: true + terser: + optional: true + tsx: + optional: true + yaml: + optional: true + dependencies: + '@types/node': 24.6.2 + esbuild: 0.25.10 + fdir: 6.5.0(picomatch@4.0.3) + picomatch: 4.0.3 + postcss: 8.5.6 + rollup: 4.50.2 + tinyglobby: 0.2.15 + optionalDependencies: + fsevents: 2.3.3 + dev: true + /vitefu@1.1.1(vite@7.2.7): resolution: {integrity: sha512-B/Fegf3i8zh0yFbpzZ21amWzHmuNlLlmJT6n7bu5e+pCHUKQIfXSYokrqOBGEMMe9UG2sostKQF9mml/vYaWJQ==} peerDependencies: @@ -39487,6 
+39635,75 @@ packages: - yaml dev: true + /vitest@3.2.4(@types/node@24.6.2)(@vitest/ui@1.6.1)(jsdom@22.1.0): + resolution: {integrity: sha512-LUCP5ev3GURDysTWiP47wRRUpLKMOfPh+yKTx3kVIEiu5KOMeqzpnYNsKyOoVrULivR8tLcks4+lga33Whn90A==} + engines: {node: ^18.0.0 || ^20.0.0 || >=22.0.0} + hasBin: true + peerDependencies: + '@edge-runtime/vm': '*' + '@types/debug': ^4.1.12 + '@types/node': ^18.0.0 || ^20.0.0 || >=22.0.0 + '@vitest/browser': 3.2.4 + '@vitest/ui': 3.2.4 + happy-dom: '*' + jsdom: '*' + peerDependenciesMeta: + '@edge-runtime/vm': + optional: true + '@types/debug': + optional: true + '@types/node': + optional: true + '@vitest/browser': + optional: true + '@vitest/ui': + optional: true + happy-dom: + optional: true + jsdom: + optional: true + dependencies: + '@types/chai': 5.2.2 + '@types/node': 24.6.2 + '@vitest/expect': 3.2.4 + '@vitest/mocker': 3.2.4(msw@2.11.6)(vite@7.2.7) + '@vitest/pretty-format': 3.2.4 + '@vitest/runner': 3.2.4 + '@vitest/snapshot': 3.2.4 + '@vitest/spy': 3.2.4 + '@vitest/ui': 1.6.1(vitest@3.2.4) + '@vitest/utils': 3.2.4 + chai: 5.2.1 + debug: 4.4.3(supports-color@10.2.2) + expect-type: 1.2.2 + jsdom: 22.1.0 + magic-string: 0.30.19 + pathe: 2.0.3 + picomatch: 4.0.3 + std-env: 3.9.0 + tinybench: 2.9.0 + tinyexec: 0.3.2 + tinyglobby: 0.2.15 + tinypool: 1.1.1 + tinyrainbow: 2.0.0 + vite: 7.2.7(@types/node@24.6.2) + vite-node: 3.2.4(@types/node@24.6.2) + why-is-node-running: 2.3.0 + transitivePeerDependencies: + - jiti + - less + - lightningcss + - msw + - sass + - sass-embedded + - stylus + - sugarss + - supports-color + - terser + - tsx + - yaml + dev: true + /viteval@0.5.3(@tanstack/query-core@5.89.0)(@tanstack/react-query@5.89.0)(@tanstack/router-core@1.131.44)(@types/node@24.2.1)(@types/react@19.2.7)(@vitejs/plugin-react@5.1.2)(tsx@4.20.4)(vite@7.2.7): resolution: {integrity: sha512-phDrceVUtOje90Oy0v0jeSuAC1FxGrho34KGUntUs9ZG5nJe+CZt59YykasOPdLv0HA5oQgRAkOY2xUvwmaRag==} hasBin: true diff --git a/website/docs/rag/overview.md 
b/website/docs/rag/overview.md
index 6c04de785..419a1759a 100644
--- a/website/docs/rag/overview.md
+++ b/website/docs/rag/overview.md
@@ -239,3 +239,40 @@ npm create voltagent-app@latest -- --example with-lancedb
 **I want to see examples** → [GitHub Examples](https://github.com/voltagent/voltagent/tree/main/examples)
 
 **I need help choosing** → Join our [Discord](https://s.voltagent.dev/discord) and ask!
+
+## Advanced Chunking
+
+For more control over how your documents are processed, VoltAgent provides a dedicated package `@voltagent/documents` with chunking and embedding utilities.
+
+### Installation
+
+```bash
+npm install @voltagent/documents
+```
+
+### Available Utilities
+
+The package includes the building blocks for document ingestion:
+
+- **RecursiveCharacterTextSplitter**: Splits general text recursively while keeping related context together
+- **OpenAIEmbeddingModel**: Generates embeddings using the OpenAI API
+- **DocumentProcessor**: Combines splitting and embedding into a single pipeline
+
+### Example Usage
+
+```typescript
+import { DocumentProcessor, RecursiveCharacterTextSplitter } from "@voltagent/documents";
+
+// 1. Split text into overlapping chunks (recommended for general text)
+const splitter = new RecursiveCharacterTextSplitter({
+  chunkSize: 1000,
+  chunkOverlap: 200,
+});
+const chunks = await splitter.splitText(longDocument);
+
+// 2. Chunk and embed in one step
+const processor = new DocumentProcessor();
+const documents = await processor.process(markdownContent, {
+  source: "docs.md",
+});
+```