Retrieval-Augmented Generation (RAG)

Implementation Example

# A simple Python RAG pipeline
class VectorDatabase:
    """Stand-in for a vector store that serves a fixed, in-memory corpus."""

    # Canned corpus returned by every search; no embedding or ranking is done.
    _DOCUMENTS = (
        "Design patterns are reusable solutions to common software problems.",
    )

    def similarity_search(self, query, k=1):
        """Return at most ``k`` documents for ``query``.

        The search is simulated: ``query`` is not inspected and the
        documents come from a fixed corpus in a fixed order.

        Args:
            query: The search text (unused by this simulation).
            k: Maximum number of documents to return. Values below 1
                yield an empty list.

        Returns:
            A new list of document strings, no longer than ``k``.
        """
        # Clamp so a negative k cannot slice from the end of the corpus.
        limit = max(k, 0)
        return list(self._DOCUMENTS[:limit])

class LLMClient:
    """Mock language-model client: echoes the prompt and replies with a fixed string."""

    def generate(self, prompt):
        """Print ``prompt`` to stdout between ``---`` rules and return a canned answer."""
        outgoing = f"Sending prompt to LLM:\n---\n{prompt}\n---"
        print(outgoing)
        canned_reply = "Based on the context, design patterns are reusable solutions..."
        return canned_reply

class RAGSystem:
    """Retrieve-augment-generate pipeline over a document store and an LLM.

    ``db`` must provide ``similarity_search(query, k=...)`` returning an
    iterable of strings; ``llm`` must provide ``generate(prompt)``.
    """

    def __init__(self, db, llm):
        """Store the document store and the LLM client used by ``query``."""
        self.db = db
        self.llm = llm

    def query(self, user_prompt, k=1):
        """Answer ``user_prompt`` using context retrieved from the store.

        Args:
            user_prompt: The question to answer; also used as the
                retrieval query.
            k: Number of context documents to request from the store.
                Defaults to 1.

        Returns:
            Whatever ``llm.generate`` returns for the augmented prompt.
        """
        # 1. Retrieve context
        context_docs = self.db.similarity_search(user_prompt, k=k)
        # Multiple documents are separated by newlines inside the prompt.
        context = "\n".join(context_docs)

        # 2. Augment prompt
        augmented_prompt = (
            f"Use the following context to answer the question.\n"
            f"Context: {context}\n"
            f"Question: {user_prompt}"
        )

        # 3. Generate response
        return self.llm.generate(augmented_prompt)

# Usage: wire the simulated store and mock LLM together, then ask one question.
rag = RAGSystem(db=VectorDatabase(), llm=LLMClient())
answer = rag.query("What are design patterns?")
print(answer)

Retrieval-Augmented Generation (RAG)

Intent & Description

Real-world Use Case

Advantages

Disadvantages