historical-ocr / requirements.txt
milwright's picture
modularize + nest scripts; reduce technical debt
94e74f0
raw
history blame contribute delete
569 Bytes
# Requirements for the Historical OCR application.
# Every entry below sets only a minimum version (>=); nothing is pinned or
# capped, so the versions actually installed depend on when pip is run.
# Core dependencies
streamlit>=1.30.0
mistralai>=0.1.0 # Mistral AI SDK. NOTE(review): ">=0.1.0" admits every release from 0.1.0 on, not just the latest; raise the floor if the code relies on newer SDK APIs (TODO confirm)
pydantic>=2.5.0 # Minimum raised to 2.5 for better BaseModel support
# Image processing
Pillow>=10.0.0
opencv-python-headless>=4.8.0.74
pdf2image>=1.16.0 # NOTE: wraps the Poppler command-line tools, which pip does not install
pytesseract>=0.3.10 # For local OCR fallback. NOTE: wraps the Tesseract binary, which pip does not install
matplotlib>=3.7.0 # For visualization in preprocessing tests
# Data handling and utilities
numpy>=1.24.0
pycountry>=22.1.10
requests>=2.31.0
python-dotenv>=1.0.0
python-multipart>=0.0.6 # NOTE(review): purpose is not evident from this file; confirm it is still needed
# Type checking and linting
# NOTE(review): these look like development-time tools listed alongside the
# runtime dependencies; consider a separate dev requirements file (confirm).
mypy>=1.5.0
ruff>=0.1.5