AI Foundations Archives - Page 4 of 4

Chunking strategies greatly affect RAG quality:

import { RecursiveCharacterTextSplitter } from 'langchain/text_splitter';

// Basic chunking
// Configure a recursive splitter: it tries each separator in order and only
// falls back to the next, finer-grained one when a piece is still too large.
const splitter = new RecursiveCharacterTextSplitter({
  // Upper bound on chunk length (measured in characters by default — see the
  // LangChain text splitter documentation).
  chunkSize: 1000,
  // Amount shared between neighbouring chunks so context carries across boundaries.
  chunkOverlap: 200,
  // Paragraph break, line break, space, then individual characters.
  separators: ['\n\n', '\n', ' ', ''],
});

// `document` is the raw text to split; the result is an array of chunk strings.
const chunks = await splitter.splitText(document);

Semantic Chunking

/**
 * Groups whole sentences of `text` into chunks that stay within an
 * approximate token budget, so no chunk boundary falls mid-sentence.
 *
 * Tokens are approximated by counting whitespace-separated words. A single
 * sentence that exceeds `maxTokens` on its own is kept intact as its own chunk.
 *
 * @param {string} text - Text to split.
 * @param {number} [maxTokens=500] - Approximate per-chunk token budget.
 * @returns {Promise<string[]>} Chunks in document order; empty for blank input.
 */
async function semanticChunk(text, maxTokens = 500) {
  // `*` rather than `+` on the terminator class keeps a trailing fragment
  // that has no closing punctuation instead of silently dropping it.
  const sentences = (text.match(/[^.!?]+[.!?]*/g) || [])
    .map((piece) => piece.trim())
    .filter(Boolean);

  if (sentences.length === 0) {
    // No sentence-like content (e.g. blank or punctuation-only input).
    const leftover = text.trim();
    return leftover ? [leftover] : [];
  }

  const chunks = [];
  let current = [];
  let tokenCount = 0;

  for (const sentence of sentences) {
    // Approximate token count: words separated by runs of whitespace.
    const tokens = sentence.split(/\s+/).length;
    // Flush before adding when this sentence would overflow the budget.
    if (tokenCount + tokens > maxTokens && current.length) {
      chunks.push(current.join(' '));
      current = [];
      tokenCount = 0;
    }
    current.push(sentence);
    tokenCount += tokens;
  }
  if (current.length) chunks.push(current.join(' '));
  return chunks;
}

Best Practices

Chunk size: 500-1000 tokens
Overlap: 10-20% of the chunk size, so context carries across chunk boundaries
Preserve semantic boundaries

/**
 * Keeps per-session chat history in memory and sends it, together with a
 * system prompt, to the chat completions endpoint on every turn.
 */
class ConversationManager {
  /**
   * @param {object} [options]
   * @param {number} [options.maxTokens=4000] - Estimated token budget for the stored history.
   * @param {string} [options.systemPrompt] - System message prepended to every request.
   */
  constructor(options = {}) {
    this.maxTokens = options.maxTokens || 4000;
    this.systemPrompt = options.systemPrompt || 'You are a helpful assistant.';
    this.conversations = new Map();
  }

  /**
   * Returns the mutable message list for a session, creating it on first use.
   *
   * @param {string} sessionId
   * @returns {Array<{role: string, content: string}>}
   */
  getHistory(sessionId) {
    if (!this.conversations.has(sessionId)) {
      this.conversations.set(sessionId, []);
    }
    return this.conversations.get(sessionId);
  }

  /**
   * Appends the user message, trims old history to the token budget, requests
   * a completion and records the assistant reply.
   *
   * @param {string} sessionId
   * @param {string} userMessage
   * @returns {Promise<string>} The assistant reply content.
   * @throws Rethrows any error from the completion request; the pending user
   *   message is removed from the history first so a retry does not duplicate it.
   */
  async chat(sessionId, userMessage) {
    const history = this.getHistory(sessionId);
    const userEntry = { role: 'user', content: userMessage };
    history.push(userEntry);

    // Trim oldest messages if too long, but never evict the message that was
    // just added: an oversized user turn must still reach the model.
    while (history.length > 1 && this.estimateTokens(history) > this.maxTokens) {
      history.shift();
    }

    let response;
    try {
      response = await openai.chat.completions.create({
        model: 'gpt-4',
        messages: [
          { role: 'system', content: this.systemPrompt },
          ...history,
        ],
      });
    } catch (err) {
      // Roll back the unanswered user turn so the history stays consistent.
      const pendingIndex = history.lastIndexOf(userEntry);
      if (pendingIndex !== -1) history.splice(pendingIndex, 1);
      throw err;
    }

    const reply = response.choices[0].message.content;
    history.push({ role: 'assistant', content: reply });
    return reply;
  }

  /**
   * Rough token estimate: total content length divided by four.
   * Messages with missing content count as zero instead of throwing.
   *
   * @param {Array<{content: (string|null|undefined)}>} messages
   * @returns {number}
   */
  estimateTokens(messages) {
    return messages.reduce((sum, m) => sum + (m.content || '').length / 4, 0);
  }
}

Category: AI Foundations

Text Chunking Strategies for RAG Applications

Semantic Chunking

Best Practices

Building Conversational AI with Context Memory in Node.js