Spaces:
Paused
Paused
| # Core dependencies (updated versions) | |
| python-dotenv>=1.1.1 | |
| pymupdf4llm>=0.0.27 | |
| beautifulsoup4>=4.13.4 | |
| requests>=2.32.4 | |
| pandas>=2.2.3 | |
| openai>=1.99.9 | |
| networkx>=3.5 | |
| numpy>=2.3.1 | |
| scikit-learn>=1.7.1 | |
| streamlit>=1.47.0 | |
| # FastAPI and realtime API dependencies | |
| fastapi>=0.104.0 # For realtime API server | |
| uvicorn[standard]>=0.24.0 # ASGI server for FastAPI | |
| pydantic>=2.4.0 # Data validation and settings management | |
| # Document processing | |
| pymupdf>=1.24.0 # For PDF processing and image extraction | |
| Pillow>=10.0.0 # For image processing | |
| lxml>=5.0.0 # For HTML parsing | |
| html5lib>=1.1 # Alternative HTML parser | |
| # Vector stores and search | |
| faiss-cpu>=1.8.0 # For vector similarity search (use faiss-gpu if CUDA available) | |
| chromadb>=0.5.0 # Alternative vector database | |
| rank-bm25>=0.2.2 # For BM25 keyword search | |
| # Language models and embeddings | |
| sentence-transformers>=3.0.0 # For DPR and cross-encoder | |
| transformers>=4.40.0 # Required by sentence-transformers | |
| torch>=2.0.0 # For neural models (CPU version) | |
| # For GPU support, install separately: | |
| # pip install torch torchvision --index-url https://download.pytorch.org/whl/cu118 | |
| ftfy>=6.1.1 # Text preprocessing for CLIP | |
| regex>=2023.0.0 # Text processing | |
| # For CLIP (optional - enable if needed): | |
| # git+https://github.com/openai/CLIP.git | |
| # Token counting and management | |
| tiktoken>=0.7.0 # For OpenAI token counting | |
| # Database (optional) | |
| # pymongo>=4.0.0 # Uncomment if using MongoDB for metadata | |
| # Development and debugging | |
| tqdm>=4.65.0 # Progress bars | |
| ipython>=8.0.0 # For interactive debugging | |
| jupyter>=1.0.0 # For notebook development | |
| # Data visualization (optional) | |
| matplotlib>=3.7.0 # For plotting | |
| seaborn>=0.12.0 # Statistical visualization | |
| plotly>=5.15.0 # Interactive plots | |
| # Optional advanced features (uncomment if needed) | |
| # langchain>=0.2.11 # For advanced RAG patterns | |
| # langchain-openai>=0.1.20 # OpenAI integration for LangChain | |
| # llama-index>=0.10.51 # Alternative RAG framework | |
| # Additional utility packages | |
| colorama>=0.4.6 # Colored console output | |
| rich>=13.0.0 # Rich text and beautiful formatting in terminal |