test RAG with local Ollama models

initial commit
2026-01-26 19:49:02 +01:00
commit b1405f3b84
4 changed files with 250 additions and 0 deletions
@@ -0,0 +1,25 @@
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+venv/
+env/
+ENV/
+
+# Vector store
+vectorstore/
+
+# Uploads
+uploads/
+
+# IDE
+.vscode/
+.idea/
+*.swp
+*.swo
+
+# OS
+.DS_Store
+Thumbs.db
@@ -0,0 +1,65 @@
+# Local RAG Setup
+
+Minimal RAG implementation with LangChain, Ollama, and FAISS.
+
+## Dependencies
+
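+Only 5 packages in `requirements.txt` (the code also imports `langchain_community`; run `pip install langchain-community` if it is missing):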
+- `langchain` - Core framework
+- `langchain-ollama` - Ollama integration
+- `faiss-cpu` - Vector search
+- `sentence-transformers` - Embeddings
+- `pypdf` - PDF loading
+
+## Installation
+
+```bash
+# Create conda environment
+conda create -n local_rag python=3.10 -y
+conda activate local_rag
+
+# Install dependencies
+pip install -r requirements.txt
+```
+
+## Setup Ollama
+
+```bash
+# Make sure Ollama is running
+ollama serve
+
+# Pull a model (in another terminal)
+ollama pull llama2
+```
+
+## Usage
+
+Edit `local_rag.py` and uncomment the example code:
+
+```python
+# Add documents
+rag.add_documents([
+    "path/to/document1.pdf",
+    "path/to/document2.txt"
+])
+
+# Query
+question = "What is this document about?"
+answer = rag.query(question)
+print(f"Answer: {answer}")
+```
+
+Run:
+```bash
+python local_rag.py
+```
+
+## How it works
+
+1. **Load documents** - PDF (`.pdf`) or text (`.txt`, `.md`) files
+2. **Split into chunks** - 1000 chars with 200 overlap
+3. **Create embeddings** - Using sentence-transformers
+4. **Store in FAISS** - Fast similarity search
+5. **Query** - Retrieve relevant chunks and generate answer with Ollama
+
+That's it! Simple and minimal.
@@ -0,0 +1,155 @@
+"""
+Local RAG setup with LangChain, Ollama, and FAISS
+Minimal dependencies, simple code
+"""
+import os
+from pathlib import Path
+from langchain_community.document_loaders import PyPDFLoader, TextLoader
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain_community.embeddings import HuggingFaceEmbeddings
+from langchain_community.vectorstores import FAISS
+from langchain_ollama import ChatOllama
+
+
+class LocalRAG:
+    """Minimal retrieval-augmented generation pipeline on FAISS and Ollama.
+
+    Files are split into overlapping chunks, embedded with a
+    sentence-transformers model, and stored in a FAISS index that is saved
+    under ``vectorstore_path``. At query time the most similar chunks are
+    placed into the prompt sent to the Ollama chat model.
+    """
+
+    def __init__(
+        self,
+        vectorstore_path="./vectorstore",
+        ollama_model="llama2",
+        *,
+        ollama_base_url="http://localhost:11434",
+        embedding_model="sentence-transformers/all-MiniLM-L6-v2",
+        chunk_size=1000,
+        chunk_overlap=200,
+    ):
+        """Initialize local RAG system.
+
+        Args:
+            vectorstore_path: Directory the FAISS index is loaded from and
+                saved to.
+            ollama_model: Name of the Ollama model used to generate answers.
+            ollama_base_url: URL of the Ollama server.
+            embedding_model: Hugging Face model name used for embeddings.
+            chunk_size: Maximum chunk length handed to the text splitter.
+            chunk_overlap: Overlap between consecutive chunks.
+        """
+        self.vectorstore_path = vectorstore_path
+        self.ollama_model = ollama_model
+
+        # Embeddings
+        print("Loading embeddings model...")
+        self.embeddings = HuggingFaceEmbeddings(model_name=embedding_model)
+
+        # Text splitter
+        self.text_splitter = RecursiveCharacterTextSplitter(
+            chunk_size=chunk_size,
+            chunk_overlap=chunk_overlap
+        )
+
+        # Ollama LLM
+        print(f"Connecting to Ollama (model: {ollama_model})...")
+        self.llm = ChatOllama(
+            model=ollama_model,
+            base_url=ollama_base_url
+        )
+
+        # Vector store (load if exists, otherwise None)
+        self.vectorstore = None
+        self._load_vectorstore()
+
+    def _load_vectorstore(self):
+        """Load a previously saved index from ``self.vectorstore_path``, if any.
+
+        Leaves ``self.vectorstore`` as ``None`` when no index file exists or
+        when loading fails, so the next ``add_documents`` call builds a new
+        index.
+        """
+        index_file = os.path.join(self.vectorstore_path, "index.faiss")
+        if not os.path.exists(index_file):
+            return
+
+        try:
+            # SECURITY: loading unpickles the saved docstore, which is why the
+            # explicit opt-in flag is required. Only point vectorstore_path at
+            # a directory this program wrote itself.
+            self.vectorstore = FAISS.load_local(
+                self.vectorstore_path,
+                self.embeddings,
+                allow_dangerous_deserialization=True
+            )
+        except Exception as e:
+            # Best effort: an unreadable index must not prevent start-up.
+            print(f"Could not load vector store: {e}")
+            self.vectorstore = None
+        else:
+            print(f"Loaded existing vector store from {self.vectorstore_path}")
+
+    def _make_loader(self, path):
+        """Return a loader for ``path``, or ``None`` for an unsupported suffix."""
+        suffix = path.suffix.lower()
+        if suffix == '.pdf':
+            return PyPDFLoader(str(path))
+        if suffix in ('.txt', '.md'):
+            # Explicit encoding: the platform default is not UTF-8 everywhere.
+            return TextLoader(str(path), encoding="utf-8")
+        return None
+
+    def add_documents(self, file_paths):
+        """Chunk, embed, and index the given files, then save the index.
+
+        Args:
+            file_paths: A single path or an iterable of paths (``str`` or
+                ``os.PathLike``). ``.pdf``, ``.txt`` and ``.md`` files are
+                supported; missing, unsupported, or unreadable files are
+                skipped with a warning.
+        """
+        # A bare string would otherwise be iterated character by character.
+        if isinstance(file_paths, (str, os.PathLike)):
+            file_paths = [file_paths]
+        else:
+            file_paths = list(file_paths)
+
+        print(f"\nLoading {len(file_paths)} document(s)...")
+        all_docs = []
+
+        for file_path in file_paths:
+            path = Path(file_path)
+            if not path.exists():
+                print(f"Warning: {file_path} not found, skipping")
+                continue
+
+            loader = self._make_loader(path)
+            if loader is None:
+                print(f"Warning: Unsupported file type {path.suffix}, skipping")
+                continue
+
+            try:
+                docs = loader.load()
+            except Exception as e:
+                # One corrupt or undecodable file should not abort the batch.
+                print(f"Warning: Could not load {file_path}: {e}, skipping")
+                continue
+
+            chunks = self.text_splitter.split_documents(docs)
+            all_docs.extend(chunks)
+            print(f"  - {path.name}: {len(chunks)} chunks")
+
+        if not all_docs:
+            print("No documents loaded!")
+            return
+
+        # Create or update vector store
+        print(f"\nCreating embeddings for {len(all_docs)} chunks...")
+        if self.vectorstore is None:
+            self.vectorstore = FAISS.from_documents(all_docs, self.embeddings)
+        else:
+            # Append to the existing index rather than building a second,
+            # throwaway index only to merge it in.
+            self.vectorstore.add_documents(all_docs)
+
+        # Save
+        os.makedirs(self.vectorstore_path, exist_ok=True)
+        self.vectorstore.save_local(self.vectorstore_path)
+        print(f"Vector store saved to {self.vectorstore_path}")
+
+    def query(self, question, k=4):
+        """Answer ``question`` using the ``k`` most similar chunks as context.
+
+        Args:
+            question: The question to answer.
+            k: Number of chunks to retrieve from the vector store.
+
+        Returns:
+            The model's answer text, or a message starting with ``"Error:"``
+            when no documents are indexed or the question is blank.
+        """
+        if self.vectorstore is None:
+            return "Error: No documents loaded. Please add documents first."
+        if not question or not question.strip():
+            # Do not spend a retrieval and an LLM call on a blank question.
+            return "Error: Question is empty."
+
+        print("\nSearching for relevant documents...")
+        docs = self.vectorstore.similarity_search(question, k=k)
+        print(f"Found {len(docs)} relevant documents")
+
+        # Combine context from documents
+        context = "\n\n".join(doc.page_content for doc in docs)
+
+        # Create prompt
+        prompt = f"""Use the following context to answer the question.
+If you don't know the answer, say that you don't know instead of making up an answer.
+
+Context:
+{context}
+
+Question: {question}
+
+Answer:"""
+
+        print("Generating answer with Ollama...")
+        response = self.llm.invoke(prompt)
+        # Fall back to str() in case the response object has no `.content`.
+        answer = response.content if hasattr(response, 'content') else str(response)
+
+        return answer
+
+
+def main():
+    """Example usage: build the RAG system and index the sample documents."""
+    print("=" * 60)
+    print("Local RAG with LangChain, Ollama, and FAISS")
+    print("=" * 60)
+
+    # Initialize
+    rag = LocalRAG(ollama_model="llama2")
+
+    # Add documents (replace these sample paths with your own files)
+    rag.add_documents([
+         "diverses/local_rag/test1.pdf",
+         "diverses/local_rag/test2.txt"
+    ])
+
+    # Query (uncomment to ask a question about the indexed documents)
+    # question = "What is this document about?"
+    # answer = rag.query(question)
+    # print(f"\nQuestion: {question}")
+    # print(f"Answer: {answer}")
+
+    # Documents are already added above, so only the query step is left.
+    print("\nSetup complete! Uncomment the query code above to ask questions.")
+
+
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,5 @@
+langchain
+langchain-ollama
+faiss-cpu
+sentence-transformers
+pypdf