Spaces:
Running
Running
Update requirements.txt
Browse files — requirements.txt +19 -45
requirements.txt
CHANGED
@@ -1,45 +1,19 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
pdf2image==1.17.0
|
21 |
-
pymupdf==1.24.0
|
22 |
-
pdfplumber==0.11.0
|
23 |
-
|
24 |
-
# Image processing and computer vision
|
25 |
-
opencv-python==4.10.0.84
|
26 |
-
numpy==1.26.4
|
27 |
-
ftfy==6.1.1
|
28 |
-
regex==2023.12.25
|
29 |
-
|
30 |
-
# Document processing
|
31 |
-
python-docx==1.1.2
|
32 |
-
python-pptx==0.6.23
|
33 |
-
|
34 |
-
# Additional utilities
|
35 |
-
requests==2.32.3
|
36 |
-
torch==2.4.0
|
37 |
-
torchvision==0.19.0
|
38 |
-
|
39 |
-
# For better PDF extraction (optional - can be commented out if issues)
|
40 |
-
# detectron2 @ git+https://github.com/facebookresearch/detectron2.git
|
41 |
-
# layoutparser[paddlepaddle]==0.3.4
|
42 |
-
|
43 |
-
# Essential for text processing
|
44 |
-
tiktoken==0.7.0
|
45 |
-
charset-normalizer==3.3.2
|
|
|
1 |
+
unstructured[pdf]
|
2 |
+
unstructured-inference
|
3 |
+
pillow
|
4 |
+
numpy>=1.26.2,<3.0
|
5 |
+
unidecode==1.3.8
|
6 |
+
accelerate==1.5.2
|
7 |
+
pypdf==5.4.0
|
8 |
+
sentence-transformers==3.4.1
|
9 |
+
gradio==5.24.0
|
10 |
+
langchain_community==0.3.21
|
11 |
+
chromadb==1.0.4
|
12 |
+
PyPDF2==3.0.1
|
13 |
+
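fitz==0.0.1.dev2  # NOTE(review): the PyPI "fitz" distribution is not PyMuPDF; `import fitz` is provided by the `pymupdf` package — confirm which one is intended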
|
14 |
+
ipdb==0.13.13
|
15 |
+
langchain==0.3.23
|
16 |
+
huggingface_hub
|
17 |
+
langchain-huggingface==0.1.2
|
18 |
+
faiss-gpu-cu12 # CUDA 12.x, Python 3.8+
|
19 |
+
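faiss-gpu-cu11 # CUDA 11.x, Python 3.8+ — NOTE(review): appears to be an alternative to the CUDA 12.x build, not a companion; keep only the variant matching the runtime's CUDA version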
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|