# Environment configuration (dotenv format).
# One KEY=value assignment per line; comments are full lines starting with '#'.
# Do not append comments after a value: many parsers keep them as part of the value.

# OpenRouter endpoint and API key for LLM calls
OPENAI_BASE_URL=https://openrouter.ai/api/v1
# Placeholder: replace with a real key and never commit the real value.
OPENAI_API_KEY=sk-or-v1-replace_me

# Main LLM used for classification and final answer generation
LLM_MODEL=openai/gpt-4.1-mini

# Local embedding model for Chroma indexing/search
EMBEDDING_MODEL=deepvk/USER2-small
EMBEDDING_DEVICE=cpu

# Chroma connection settings
CHROMA_HOST=chromadb
CHROMA_PORT=8000
CHROMA_COLLECTION=law_chunks
CHROMA_SSL=false

# Retrieval settings
RAG_TOP_K=5
FTS_TOP_K=20
VECTOR_TOP_K=20
INDEX_BATCH_SIZE=16
# Timeout for LLM calls, in seconds
LLM_TIMEOUT_SECONDS=90

# FastAPI bind settings
API_HOST=0.0.0.0
API_PORT=8080
LOG_LEVEL=INFO

# Background indexing on startup
AUTO_INDEX_ON_STARTUP=true
AUTO_INDEX_ONLY_IF_EMPTY=true
AUTO_INDEX_RESET_COLLECTION=false
# Delay between indexing attempts, in seconds
AUTO_INDEX_RETRY_DELAY_SECONDS=15
AUTO_INDEX_MAX_ATTEMPTS=20