# TDZ C64 Knowledge Base - Environment Configuration
# Last Updated: 2025-12-17
# ============================================================
# Data Storage
# ============================================================
# Data directory of the knowledge base.
# Machine-specific absolute Windows path; adjust it for each installation.
TDZ_DATA_DIR=C:\Users\mit\.tdz-c64-knowledge
# ============================================================
# Search Configuration
# ============================================================
# Enable SQLite FTS5 full-text search (480x faster than BM25). Set to 1 to enable.
USE_FTS5=1
# Enable semantic search with embeddings (conceptual search). Set to 1 to enable.
USE_SEMANTIC_SEARCH=1
# Sentence-transformers model used for semantic search.
# NOTE(review): presumably only consulted when USE_SEMANTIC_SEARCH=1 - confirm.
SEMANTIC_MODEL=all-MiniLM-L6-v2
# Enable the BM25 search algorithm (fallback). Set to 1 to enable.
# NOTE(review): how the enabled search backends are prioritised is not visible
# in this file - confirm against the search code.
USE_BM25=1
# Enable NLTK query preprocessing (stopword removal, stemming). Set to 1 to enable.
USE_QUERY_PREPROCESSING=1
# Enable fuzzy search with typo tolerance. Set to 1 to enable.
USE_FUZZY_SEARCH=1
# Fuzzy search threshold on a 0-100 scale (default: 80).
# NOTE(review): presumably a minimum similarity score, so a higher value is
# stricter - confirm against the fuzzy-matching code.
FUZZY_THRESHOLD=80
# Search cache configuration.
# NOTE(review): units are not stated in this file. SEARCH_CACHE_SIZE is
# presumably the maximum number of cached entries and SEARCH_CACHE_TTL the
# entry lifetime in seconds - confirm against the code that reads them.
SEARCH_CACHE_SIZE=100
SEARCH_CACHE_TTL=300
# ============================================================
# Feature Toggles
# ============================================================
# Enable OCR for scanned PDFs. Set to 1 to enable.
# On Windows, the Poppler binaries used for scanned PDF support are located via
# POPPLER_PATH (see the OCR Configuration section of this file).
USE_OCR=1
# ============================================================
# Security Configuration
# ============================================================
# Comma-separated list of allowed document directories (path traversal protection).
# Leave empty to allow all directories.
# The entries below are machine-specific absolute Windows paths; the second one
# lies inside the directory configured as TDZ_DATA_DIR.
ALLOWED_DOCS_DIRS=C:\Users\mit\Downloads\tdz-c64-knowledge-input,C:\Users\mit\.tdz-c64-knowledge\scraped_docs
# ============================================================
# LLM Integration (for Smart Auto-Tagging & RAG)
# ============================================================
# LLM provider: anthropic or openai
LLM_PROVIDER=anthropic
# Anthropic API key (optional - for RAG features).
# Get your key from: https://console.anthropic.com/
# To set it, uncomment the line below and replace the placeholder with a real
# key. Keep real keys out of version control.
# ANTHROPIC_API_KEY=sk-ant-...
# NOTE(review): no key placeholder is provided for the openai provider -
# confirm which variable the application expects for it.
# LLM model to use.
# NOTE(review): presumably must be a model of the provider selected in
# LLM_PROVIDER - confirm.
# Anthropic models: claude-3-haiku-20240307, claude-3-5-sonnet-20241022, claude-3-opus-20240229
# OpenAI models: gpt-3.5-turbo, gpt-4, gpt-4-turbo
LLM_MODEL=claude-3-haiku-20240307
# ============================================================
# OCR Configuration (for Poppler - scanned PDF support)
# ============================================================
# Optional: path to the Poppler binary directory (Windows only).
# Download from: https://github.com/oschwartz10612/poppler-windows/releases/
# Example (illustrative; the version in the path depends on the release you unpack):
#   C:\path\to\poppler-24.08.0\Library\bin
# The value below is a machine-specific absolute path; adjust it for each installation.
POPPLER_PATH=C:\Users\mit\claude\c64server\tdz-c64-knowledge\poppler-25.12.0\Library\bin