Update requirements.txt
Browse files- requirements.txt +108 -1
requirements.txt
CHANGED
@@ -107,4 +107,111 @@ tabulate>=0.9.0
|
|
107 |
packaging>=23.1
|
108 |
|
109 |
jsonschema>=4.23.0
|
110 |
-
spacy==3.7.5
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
107 |
packaging>=23.1
|
108 |
|
109 |
jsonschema>=4.23.0
|
110 |
+
spacy==3.7.5
|
111 |
+
|
112 |
+
### PASTING IN CONTENTS OF OPTIONAL_LANGCHAIN
|
113 |
+
|
114 |
+
# optional for chat with PDF
|
115 |
+
langchain==0.2.6
|
116 |
+
langchain_experimental==0.0.62
|
117 |
+
langchain-community==0.2.6
|
118 |
+
langsmith==0.1.82
|
119 |
+
langchain-core==0.2.23
|
120 |
+
langchain-text-splitters==0.2.2
|
121 |
+
#langchain_huggingface==0.0.3
|
122 |
+
|
123 |
+
pypdf>=3.17.1
|
124 |
+
# avoid textract: it requires an old version of six
|
125 |
+
#textract==1.6.5
|
126 |
+
pypdfium2>=4.24.0
|
127 |
+
|
128 |
+
# for HF embeddings
|
129 |
+
sentence_transformers>=3.0.1
|
130 |
+
# https://github.com/h2oai/instructor-embedding/tree/h2ogpt
|
131 |
+
# pip wheel .
|
132 |
+
InstructorEmbedding @ https://h2o-release.s3.amazonaws.com/h2ogpt/InstructorEmbedding-1.0.1-py3-none-any.whl
|
133 |
+
# https://github.com/h2oai/sentence-transformers/tree/h2ogpt
|
134 |
+
# pip wheel .
|
135 |
+
sentence_transformers_old @ https://h2o-release.s3.amazonaws.com/h2ogpt/sentence_transformers_old-2.2.2-py3-none-any.whl
|
136 |
+
|
137 |
+
# optional: for OpenAI endpoint or embeddings (requires key)
|
138 |
+
replicate>=0.26.0
|
139 |
+
anthropic>=0.34.2
|
140 |
+
langchain-anthropic>=0.1.20
|
141 |
+
together>=1.1.5
|
142 |
+
langchain_together==0.1.3
|
143 |
+
langchain-openai>=0.1.8
|
144 |
+
langchain-google-genai>=1.0.8
|
145 |
+
google-generativeai>=0.7.2
|
146 |
+
google-ai-generativelanguage>=0.6.6
|
147 |
+
# pydantic version conflict
|
148 |
+
#mistral_common==1.3.3
|
149 |
+
|
150 |
+
llava @ https://h2o-release.s3.amazonaws.com/h2ogpt/llava-1.7.0.dev0-py3-none-any.whl
|
151 |
+
|
152 |
+
#langchain_mistralai==0.1.2 # tokenizers<0.16.0, but transformers requires >=0.19
|
153 |
+
httpx>=0.25.2
|
154 |
+
httpx-sse>=0.3.1
|
155 |
+
mistralai>=0.4.0
|
156 |
+
# pydantic issue, don't need yet
|
157 |
+
#mistral-common==1.0.2
|
158 |
+
|
159 |
+
groq>=0.5.0
|
160 |
+
langchain-groq>=0.1.5
|
161 |
+
|
162 |
+
# local vector db
|
163 |
+
chromadb==0.4.23
|
164 |
+
|
165 |
+
pydantic-settings>=2.1.0
|
166 |
+
|
167 |
+
# server vector db
|
168 |
+
#pymilvus==2.2.8
|
169 |
+
|
170 |
+
# Weak URL support, for when opencv etc. cannot be installed. If you uncomment this one, then comment out the unstructured[local-inference]==0.12.5 and unstructured[all-docs]==0.12.5 lines below.
|
171 |
+
# unstructured==0.8.1
|
172 |
+
|
173 |
+
# strong support for images
|
174 |
+
# On Ubuntu this requires: sudo apt-get install libmagic-dev poppler-utils tesseract-ocr libtesseract-dev libreoffice
|
175 |
+
unstructured[local-inference]==0.12.5
|
176 |
+
unstructured[all-docs]==0.12.5
|
177 |
+
docx2txt==0.8
|
178 |
+
python-docx==1.1.0
|
179 |
+
#pdf2image==1.16.3
|
180 |
+
#pytesseract==0.3.10
|
181 |
+
pillow>=10.2.0
|
182 |
+
posthog
|
183 |
+
|
184 |
+
pdfminer.six==20231228
|
185 |
+
urllib3
|
186 |
+
requests_file
|
187 |
+
|
188 |
+
#pdf2image==1.16.3
|
189 |
+
#pytesseract==0.3.10
|
190 |
+
tabulate>=0.9.0
|
191 |
+
# FYI pandoc already part of requirements.txt
|
192 |
+
|
193 |
+
# Needed for JSONLoader, but causes trouble for some users
|
194 |
+
# TRY: apt-get install autoconf libtool
|
195 |
+
# unclear what happens on windows/mac for now
|
196 |
+
jq>=1.4.1; platform_machine == "x86_64"
|
197 |
+
|
198 |
+
# to check licenses
|
199 |
+
# Run: pip-licenses|grep -v 'BSD\|Apache\|MIT'
|
200 |
+
pip-licenses>=4.3.0
|
201 |
+
|
202 |
+
# weaviate vector db
|
203 |
+
# required for httpx for mistralai
|
204 |
+
weaviate-client==3.26.2
|
205 |
+
|
206 |
+
# vllm==0.2.2
|
207 |
+
|
208 |
+
# only gradio>=4
|
209 |
+
gradio_pdf>=0.0.7
|
210 |
+
|
211 |
+
gradio_tools>=0.0.9
|
212 |
+
|
213 |
+
# Qdrant - https://qdrant.tech vector database
|
214 |
+
qdrant-client>=1.8.0
|
215 |
+
|
216 |
+
# MIT:
|
217 |
+
arxiv>=2.1.3
|