Muzammil6376 committed on
Commit
840ffdd
·
verified ·
1 Parent(s): 7154bdc

Update requirements.txt

Browse files
Files changed (1) hide show
  1. requirements.txt +48 -14
requirements.txt CHANGED
@@ -1,14 +1,48 @@
1
- gradio
2
- langchain>=0.2.0
3
- langchain-community
4
- huggingface_hub
5
- unstructured
6
- pdfminer.six
7
- pi-heif
8
- unstructured-inference
9
- PyMuPDF
10
- pdf2image
11
- pytesseract
12
- transformers
13
- sentence-transformers
14
- faiss-cpu
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Core dependencies for multimodal RAG system
2
+ gradio==4.44.0
3
+ huggingface-hub==0.25.0
4
+ transformers==4.45.0
5
+
6
+ # LangChain dependencies
7
+ langchain==0.3.0
8
+ langchain-community==0.3.0
9
+ langchain-core==0.3.0
10
+ langchain-text-splitters==0.3.0
11
+ langchain-huggingface==0.1.0
12
+
13
+ # Vector store and multimodal embeddings
14
+ faiss-cpu==1.8.0
15
+ sentence-transformers==3.0.1
16
+ clip-by-openai==1.0
17
+
18
+ # PDF processing and multimodal support
19
+ unstructured[pdf]==0.15.12
20
+ pillow==10.4.0
21
+ pdf2image==1.17.0
22
+ pymupdf==1.24.0
23
+ pdfplumber==0.11.0
24
+
25
+ # Image processing and computer vision
26
+ opencv-python==4.10.0.84
27
+ numpy==1.26.4
28
+ ftfy==6.1.1
29
+ regex==2023.12.25
30
+
31
+ # Document processing
32
+ python-docx==1.1.2
33
+ python-pptx==0.6.23
34
+
35
+ # Additional utilities
36
+ requests==2.32.3
37
+ torch==2.4.0
38
+ torchvision==0.19.0
39
+
40
+ # For better PDF extraction
41
+ #detectron2 @ git+https://github.com/facebookresearch/detectron2.git
42
+ #layoutparser[paddlepaddle]==0.3.4
43
+
44
+ # System dependencies (OS-level apt packages, not pip packages; on Hugging Face Spaces they belong in packages.txt). These might be needed for unstructured.
45
+ poppler-utils
46
+ #tesseract-ocr
47
+ #libgl1-mesa-glx
48
+ #libglib2.0-0