Spaces:
Running
Running
Update requirements.txt
Browse files- requirements.txt +31 -23
requirements.txt
CHANGED
@@ -1,40 +1,48 @@
|
|
1 |
# ===== CORE API =====
|
2 |
-
fastapi==0.
|
3 |
-
uvicorn==0.
|
4 |
python-multipart==0.0.6
|
5 |
python-dotenv==1.0.0
|
6 |
|
7 |
-
# ===== AI/ML (
|
8 |
-
torch==
|
9 |
-
transformers==4.
|
10 |
-
diffusers==0.
|
11 |
-
huggingface-hub==0.
|
12 |
-
accelerate==0.
|
|
|
13 |
|
14 |
# ===== AUDIO PROCESSING =====
|
15 |
soundfile==0.12.1
|
16 |
-
librosa==0.
|
17 |
-
gTTS==2.
|
18 |
-
SpeechRecognition==3.
|
19 |
pydub==0.25.1
|
|
|
20 |
|
21 |
# ===== IMAGE/VIDEO =====
|
22 |
-
Pillow==
|
23 |
-
imageio[ffmpeg]==2.
|
24 |
-
imageio-ffmpeg==0.4.
|
25 |
moviepy==1.0.3
|
26 |
-
opencv-python-headless==4.
|
|
|
|
|
|
|
|
|
|
|
27 |
|
28 |
# ===== UTILITIES =====
|
|
|
|
|
|
|
29 |
langdetect==1.0.9
|
30 |
-
|
31 |
-
numpy==1.26.3
|
32 |
-
tqdm==4.66.1
|
33 |
-
requests==2.31.0
|
34 |
|
35 |
# ===== GRADIO INTERFACE =====
|
36 |
-
gradio==
|
37 |
|
38 |
-
# ===== OPTIONAL =====
|
39 |
-
#
|
40 |
-
#
|
|
|
|
1 |
# ===== CORE API =====
|
2 |
+
fastapi==0.95.2
|
3 |
+
uvicorn==0.22.0
|
4 |
python-multipart==0.0.6
|
5 |
python-dotenv==1.0.0
|
6 |
|
7 |
+
# ===== AI/ML (CORE MODELS) =====
|
8 |
+
--extra-index-url https://download.pytorch.org/whl/cpu
torch==1.13.1
|
9 |
+
transformers==4.28.1
|
10 |
+
diffusers==0.17.1
|
11 |
+
huggingface-hub==0.13.4
|
12 |
+
accelerate==0.18.0
|
13 |
+
sentencepiece==0.1.99 # Required for translation models
|
14 |
|
15 |
# ===== AUDIO PROCESSING =====
|
16 |
soundfile==0.12.1
|
17 |
+
librosa==0.9.2
|
18 |
+
gTTS==2.3.2
|
19 |
+
SpeechRecognition==3.8.1
|
20 |
pydub==0.25.1
|
21 |
+
webrtcvad==2.0.10 # Voice activity detection
|
22 |
|
23 |
# ===== IMAGE/VIDEO =====
|
24 |
+
Pillow==9.5.0
|
25 |
+
imageio[ffmpeg]==2.31.1
|
26 |
+
imageio-ffmpeg==0.4.8
|
27 |
moviepy==1.0.3
|
28 |
+
opencv-python-headless==4.7.0.72
|
29 |
+
|
30 |
+
# ===== DOCUMENT PROCESSING =====
|
31 |
+
pymupdf==1.22.5
|
32 |
+
python-docx==1.1.0 # For Word files
|
33 |
+
pdf2image==1.17.0 # PDF to image conversion
|
34 |
|
35 |
# ===== UTILITIES =====
|
36 |
+
numpy==1.23.5
|
37 |
+
tqdm==4.65.0
|
38 |
+
requests==2.28.2
|
39 |
langdetect==1.0.9
|
40 |
+
protobuf==3.20.3 # Required for some Hugging Face models
|
|
|
|
|
|
|
41 |
|
42 |
# ===== GRADIO INTERFACE =====
|
43 |
+
gradio==3.41.0
|
44 |
|
45 |
+
# ===== OPTIONAL (UNCOMMENT IF NEEDED) =====
|
46 |
+
# scipy==1.10.1 # Advanced audio features
|
47 |
+
# pandas==1.5.3 # For CSV processing
|
48 |
+
# openai-whisper==20230314 # Alternative speech recognition
|