# requirements.txt for Hugging Face Spaces with NVIDIA T4 GPU
# Core Framework Dependencies

# Note: gradio, fastapi, uvicorn, datasets, huggingface-hub,
# pydantic==2.10.6, and protobuf<4 are installed by the HF Spaces SDK,
# so they are intentionally not listed in this file.

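# PyTorch with CUDA support (for GPU inference)
# Note: HF Spaces provides torch; this entry only constrains the version range.
# A version specifier does not select a CUDA build by itself --
# NOTE(review): confirm the wheel pip resolves on the Space is CUDA-enabled.
# Upper bound avoids breaking changes with newer versions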
torch>=2.0.0,<2.2.0

# Web Framework & Interface
aiohttp>=3.9.0
httpx>=0.25.0

# Hugging Face Ecosystem
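# PINNED for Phi-3 and DynamicCache compatibility
# Lower bound 4.36.0: presumably the first release that ships DynamicCache -- verify.
# Upper bound <4.41.0: avoids breaking changes in later releases.
# NOTE(review): native Phi-3 model classes appear to have first shipped in
# transformers 4.41.0, so under this cap Phi-3 checkpoints presumably have to be
# loaded with trust_remote_code=True -- confirm against the release notes.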
transformers>=4.36.0,<4.41.0
accelerate>=0.24.0,<0.28.0
tokenizers>=0.15.0
sentence-transformers>=2.2.0

# Vector Database & Search
faiss-cpu>=1.7.4
# Pin numpy to avoid compatibility issues with numpy 2.0
numpy>=1.24.0,<2.0.0
scipy>=1.11.0

# Data Processing & Utilities
pandas>=2.1.0
scikit-learn>=1.3.0

# Database & Persistence
sqlalchemy>=2.0.0
alembic>=1.12.0

# Caching & Performance
cachetools>=5.3.0
redis>=5.0.0
python-multipart>=0.0.6

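# Security & Validation
# NOTE(review): python-jose releases before 3.4.0 have published advisories
# (CVE-2024-33663, CVE-2024-33664); consider raising its lower bound -- verify.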
pydantic-settings>=2.1.0
python-dotenv>=1.0.0  # For secure .env file loading
python-jose[cryptography]>=3.3.0
bcrypt>=4.0.0

# Mobile Optimization & UI
cssutils>=2.7.0
pillow>=10.1.0
requests>=2.31.0

# Async & Concurrency
aiofiles>=23.2.0
concurrent-log-handler>=0.9.0

# Logging & Monitoring
structlog>=23.2.0
prometheus-client>=0.19.0
psutil>=5.9.0

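# Development & Testing
# NOTE(review): presumably not needed at runtime; consider moving these to a
# separate dev-only requirements file so the Space installs fewer packages.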
pytest>=7.4.0
pytest-asyncio>=0.21.0
pytest-cov>=4.1.0
black>=23.11.0
flake8>=6.1.0
mypy>=1.7.0

# Utility Libraries
python-dateutil>=2.8.0
pytz>=2023.3
tzdata>=2023.3
ujson>=5.8.0
orjson>=3.9.0

# Flask API for external integrations
flask>=3.0.0
flask-cors>=4.0.0
flask-limiter>=3.5.0  # Rate limiting for API protection

# Production WSGI Server
gunicorn>=21.2.0  # Production WSGI server (replaces Flask dev server)

# HF Spaces Specific Dependencies
# Note: huggingface-cli is part of huggingface-hub (installed by SDK)
gradio-client>=0.8.0
gradio-pdf>=0.0.6

# Model-specific dependencies
safetensors>=0.4.0
# Pin bitsandbytes to avoid breaking changes with quantization
bitsandbytes>=0.41.0,<0.43.0  # Required for 4-bit and 8-bit quantization on GPU

# Optional: Flash Attention (better performance with transformer models)
# Improves performance but adds build complexity; requires CUDA 11.8+ and a compatible GPU.
# NOTE(review): flash-attn 2.x documents support for Ampere/Ada/Hopper GPUs only,
# so it presumably will not work on the T4 (Turing) GPU this file targets --
# confirm before uncommenting the line below.
# flash-attn>=2.3.0

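# Development/debugging
# NOTE(review): interactive debugging tools, presumably unused by the deployed
# app -- consider keeping them in a dev-only requirements file.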
ipython>=8.17.0
ipdb>=0.13.0
debugpy>=1.7.0

# Security Tools (for security audits)
bandit>=1.7.5  # Security linter for Python code
safety>=2.3.5  # Dependency vulnerability scanner

# HTTP client for the ZeroGPU Chat API: no extra package is required here,
# because aiohttp is already listed earlier in this file.
# Note: No OpenAI client needed - the API is called with direct HTTP requests