|
# FastAPI and server: web framework, Uvicorn server, and python-multipart (all exact pins) |
|
fastapi==0.104.1 |
|
uvicorn==0.24.0 |
|
python-multipart==0.0.6 |
|
|
|
# ML and NLP models: transformers and sentence-transformers (exact pins) |
|
transformers==4.35.2 |
|
sentence-transformers==2.2.2 |
|
|
|
# PyTorch, plus the protobuf runtime pinned alongside it (exact pins) |
|
torch==2.1.1 |
|
protobuf==3.20.3 |
|
|
|
# Text processing and embedding utilities (numpy is a bounded range kept below 2.0, not an exact pin) |
|
scikit-learn==1.3.2 |
|
numpy>=1.26.4,<2.0 |
|
|
|
# Data validation and API models (pydantic 2.x, exact pin) |
|
pydantic==2.5.0 |
|
|
|
# HTTP requests and the Hugging Face Hub client (exact pins) |
|
requests==2.31.0 |
|
huggingface_hub==0.25.2 |
|
|
|
# Additional text processing (NLTK, exact pin) |
|
nltk==3.8.1 |
|
|
|
# Vector storage and LangChain integration - modern versions WITHOUT deprecated plugins (all unpinned: pip picks the newest releases compatible with the pins elsewhere in this file) |
|
pinecone |
|
langchain-pinecone |
|
langchain |
|
langchain-community |
|
|
|
# LLM integration (Google Generative AI SDK; lower bound only, no upper cap) |
|
google-generativeai>=0.8.5 |
|
|
|
# Tokenization (tokenizers library, exact pin) |
|
tokenizers==0.15.0 |
|
|
|
# Async processing - NOTE(review): asyncio-mqtt is an MQTT client library; confirm the service actually uses MQTT |
|
asyncio-mqtt==0.13.0 |
|
|
|
# Environment variables loaded via python-dotenv (lower bound only, no upper cap) |
|
python-dotenv>=1.0.0 |
|
|
|
# NEW PACKAGES FOR PDF PROCESSING (only additions, all unpinned): PyPDF2 for PDFs, aiofiles and httpx for async file/HTTP I/O. `requests` is not repeated here because it is already pinned under "HTTP requests". |
|
PyPDF2 |
|
aiofiles |
|
httpx