# Spaces: Paused  (hosting-page status residue; not a package requirement)
# Requirements for DOLPHIN PDF AI - Local Gemma 3n Version with Voice Chat
# Optimized for powerful GPU deployment with local models and voice functionality
# Core PyTorch dependencies (updated versions from voice_chat)
torch==2.3.1
torchvision==0.18.1
torchaudio==2.3.1
# Transformers and HuggingFace ecosystem
transformers>=4.53.0
huggingface-hub>=0.20.0
tokenizers>=0.21.0
accelerate>=0.20.0
timm>=1.0.16
bitsandbytes>=0.41.0
datasets>=2.14.0
safetensors>=0.3.0
# Gradio (using beta version from voice_chat for compatibility)
https://gradio-builds.s3.amazonaws.com/cffe9a7ab7f71e76d7214dc57c6278ffaf5bcdf9/gradio-5.0.0b1-py3-none-any.whl
# Image processing
Pillow>=10.0.0
opencv-python>=4.8.0
numpy>=1.24.0
# PDF processing
PyMuPDF>=1.23.0
# RAG and embeddings
sentence-transformers>=2.2.0
scikit-learn>=1.3.0
faiss-cpu>=1.7.4
# Text processing and markdown
markdown>=3.5.0
python-markdown-math>=0.8
# Voice processing dependencies
librosa==0.10.2.post1
soundfile==0.12.1
pydub==0.25.1
onnxruntime==1.19.0
gtts>=2.3.0
# Voice chat specific dependencies
litgpt==0.4.3
snac==1.2.0
openai-whisper
# Web framework dependencies
fastapi==0.112.4
flask==3.0.3
streamlit==1.37.1
# Utilities
tqdm>=4.66.0
requests>=2.31.0
packaging>=23.0
pyyaml>=6.0
fire
# Optional but recommended for better performance
# flash-attn>=2.0.0; platform_system != "Darwin"
# xformers>=0.0.22; platform_system != "Darwin"
# PyAudio==0.2.14  # Commented out as it can cause installation issues
# Development and debugging
ipython>=8.0.0
jupyter>=1.0.0