Spaces:
Paused
Paused
| # Requirements for DOLPHIN PDF AI - Local Gemma 3n Version with Voice Chat | |
| # Optimized for powerful GPU deployment with local models and voice functionality | |
| # Core PyTorch dependencies (updated versions from voice_chat) | |
| torch==2.3.1 | |
| torchvision==0.18.1 | |
| torchaudio==2.3.1 | |
| # Transformers and HuggingFace ecosystem | |
| transformers>=4.53.0 | |
| huggingface-hub>=0.20.0 | |
| tokenizers>=0.21.0 | |
| accelerate>=0.20.0 | |
| timm>=1.0.16 | |
| bitsandbytes>=0.41.0 | |
| datasets>=2.14.0 | |
| safetensors>=0.3.0 | |
| # Gradio (pinned to the 5.0.0b1 beta wheel used by voice_chat, for compatibility) | |
| https://gradio-builds.s3.amazonaws.com/cffe9a7ab7f71e76d7214dc57c6278ffaf5bcdf9/gradio-5.0.0b1-py3-none-any.whl | |
| # Image processing | |
| Pillow>=10.0.0 | |
| opencv-python>=4.8.0 | |
| numpy>=1.24.0 | |
| # PDF processing | |
| PyMuPDF>=1.23.0 | |
| # RAG and embeddings | |
| sentence-transformers>=2.2.0 | |
| scikit-learn>=1.3.0 | |
| faiss-cpu>=1.7.4 | |
| # Text processing and markdown | |
| markdown>=3.5.0 | |
| python-markdown-math>=0.8 | |
| # Voice processing dependencies | |
| librosa==0.10.2.post1 | |
| soundfile==0.12.1 | |
| pydub==0.25.1 | |
| onnxruntime==1.19.0 | |
| gtts>=2.3.0 | |
| # Voice chat specific dependencies | |
| litgpt==0.4.3 | |
| snac==1.2.0 | |
| openai-whisper | |
| # Web framework dependencies | |
| fastapi==0.112.4 | |
| flask==3.0.3 | |
| streamlit==1.37.1 | |
| # Utilities | |
| tqdm>=4.66.0 | |
| requests>=2.31.0 | |
| packaging>=23.0 | |
| pyyaml>=6.0 | |
| fire | |
| # Optional but recommended for better performance (disabled by default; uncomment a line to install it) | |
| # flash-attn>=2.0.0; platform_system != "Darwin" | |
| # xformers>=0.0.22; platform_system != "Darwin" | |
| # PyAudio==0.2.14 # Commented out: it builds against the PortAudio system library, so installation fails where that library is missing | |
| # Development and debugging | |
| ipython>=8.0.0 | |
| jupyter>=1.0.0 |