61 lines
1.7 KiB
Python
61 lines
1.7 KiB
Python
"""
|
|
FastAPI server for Local RAG with chat GUI.
|
|
Run with: uvicorn server:app --reload
|
|
"""
|
|
from pathlib import Path
|
|
|
|
from fastapi import FastAPI, HTTPException
|
|
from fastapi.responses import HTMLResponse
|
|
from pydantic import BaseModel
|
|
|
|
from local_rag import LocalRAG
|
|
|
|
# Initialize RAG once at startup
|
|
VECTORSTORE_PATH = "./vectorstore"
|
|
OLLAMA_MODEL = "mistral:7b"
|
|
rag = LocalRAG(vectorstore_path=VECTORSTORE_PATH, ollama_model=OLLAMA_MODEL)
|
|
|
|
app = FastAPI(title="Local RAG Chat", version="1.0.0")
|
|
|
|
|
|
class ChatRequest(BaseModel):
|
|
message: str
|
|
|
|
|
|
class ChatResponse(BaseModel):
|
|
answer: str
|
|
error: str | None = None
|
|
|
|
|
|
@app.get("/", response_class=HTMLResponse)
|
|
def chat_view():
|
|
"""Serve the chat GUI."""
|
|
html_path = Path(__file__).parent / "templates" / "chat.html"
|
|
if not html_path.exists():
|
|
raise HTTPException(status_code=500, detail="Chat template not found")
|
|
return HTMLResponse(content=html_path.read_text(encoding="utf-8"))
|
|
|
|
|
|
@app.post("/api/chat", response_model=ChatResponse)
|
|
def chat(request: ChatRequest):
|
|
"""Handle a chat message and return the RAG answer."""
|
|
if not request.message or not request.message.strip():
|
|
return ChatResponse(answer="", error="Message cannot be empty")
|
|
try:
|
|
answer = rag.query(request.message.strip())
|
|
return ChatResponse(answer=answer)
|
|
except Exception as e:
|
|
return ChatResponse(answer="", error=str(e))
|
|
|
|
|
|
@app.get("/api/health")
|
|
def health():
|
|
"""Health check and vector store status."""
|
|
has_docs = rag.vectorstore is not None
|
|
return {"status": "ok", "vectorstore_loaded": has_docs}
|
|
|
|
|
|
if __name__ == "__main__":
|
|
import uvicorn
|
|
uvicorn.run(app, host="0.0.0.0", port=8000)
|