abugaber committed on
Commit
0bb348c
1 Parent(s): 3943768

Update requirements.txt

Browse files
Files changed (1) hide show
  1. requirements.txt +108 -1
requirements.txt CHANGED
@@ -107,4 +107,111 @@ tabulate>=0.9.0
107
  packaging>=23.1
108
 
109
  jsonschema>=4.23.0
110
- spacy==3.7.5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
  packaging>=23.1
108
 
109
  jsonschema>=4.23.0
110
+ spacy==3.7.5
111
+
112
+ ### PASTING IN CONTENTS OF OPTIONAL_LANGCHAIN
113
+
114
+ # optional for chat with PDF
115
+ langchain==0.2.6
116
+ langchain_experimental==0.0.62
117
+ langchain-community==0.2.6
118
+ langsmith==0.1.82
119
+ langchain-core==0.2.23
120
+ langchain-text-splitters==0.2.2
121
+ #langchain_huggingface==0.0.3
122
+
123
+ pypdf>=3.17.1
124
+ # avoid textract, requires old six
125
+ #textract==1.6.5
126
+ pypdfium2>=4.24.0
127
+
128
+ # for HF embeddings
129
+ sentence_transformers>=3.0.1
130
+ # https://github.com/h2oai/instructor-embedding/tree/h2ogpt
131
+ # pip wheel .
132
+ InstructorEmbedding @ https://h2o-release.s3.amazonaws.com/h2ogpt/InstructorEmbedding-1.0.1-py3-none-any.whl
133
+ # https://github.com/h2oai/sentence-transformers/tree/h2ogpt
134
+ # pip wheel .
135
+ sentence_transformers_old @ https://h2o-release.s3.amazonaws.com/h2ogpt/sentence_transformers_old-2.2.2-py3-none-any.whl
136
+
137
+ # optional: for OpenAI endpoint or embeddings (requires key)
138
+ replicate>=0.26.0
139
+ anthropic>=0.34.2
140
+ langchain-anthropic>=0.1.20
141
+ together>=1.1.5
142
+ langchain_together==0.1.3
143
+ langchain-openai>=0.1.8
144
+ langchain-google-genai>=1.0.8
145
+ google-generativeai>=0.7.2
146
+ google-ai-generativelanguage>=0.6.6
147
+ # pydantic version conflict
148
+ #mistral_common==1.3.3
149
+
150
+ llava @ https://h2o-release.s3.amazonaws.com/h2ogpt/llava-1.7.0.dev0-py3-none-any.whl
151
+
152
+ #langchain_mistralai==0.1.2 # tokenizers<0.16.0, but transformers requires >=0.19
153
+ httpx>=0.25.2
154
+ httpx-sse>=0.3.1
155
+ mistralai>=0.4.0
156
+ # pydantic issue, don't need yet
157
+ #mistral-common==1.0.2
158
+
159
+ groq>=0.5.0
160
+ langchain-groq>=0.1.5
161
+
162
+ # local vector db
163
+ chromadb==0.4.23
164
+
165
+ pydantic-settings>=2.1.0
166
+
167
+ # server vector db
168
+ #pymilvus==2.2.8
169
+
170
+ # weak url support, for when opencv etc. cannot be installed. If you uncomment this one, then comment out the unstructured[local-inference] and unstructured[all-docs] lines below
171
+ # unstructured==0.8.1
172
+
173
+ # strong support for images
174
+ # Requires on Ubuntu: sudo apt-get install libmagic-dev poppler-utils tesseract-ocr libtesseract-dev libreoffice
175
+ unstructured[local-inference]==0.12.5
176
+ unstructured[all-docs]==0.12.5
177
+ docx2txt==0.8
178
+ python-docx==1.1.0
179
+ #pdf2image==1.16.3
180
+ #pytesseract==0.3.10
181
+ pillow>=10.2.0
182
+ posthog
183
+
184
+ pdfminer.six==20231228
185
+ urllib3
186
+ requests_file
187
+
188
+ #pdf2image==1.16.3
189
+ #pytesseract==0.3.10
190
+ tabulate>=0.9.0
191
+ # FYI pandoc is already part of requirements.txt
192
+
193
+ # for JSONLoader, but it causes trouble for some users
194
+ # TRY: apt-get install autoconf libtool
195
+ # unclear what happens on windows/mac for now
196
+ jq>=1.4.1; platform_machine == "x86_64"
197
+
198
+ # to check licenses
199
+ # Run: pip-licenses|grep -v 'BSD\|Apache\|MIT'
200
+ pip-licenses>=4.3.0
201
+
202
+ # weaviate vector db
203
+ # required for httpx for mistralai
204
+ weaviate-client==3.26.2
205
+
206
+ # vllm==0.2.2
207
+
208
+ # only gradio>=4
209
+ gradio_pdf>=0.0.7
210
+
211
+ gradio_tools>=0.0.9
212
+
213
+ # Qdrant - https://qdrant.tech vector database
214
+ qdrant-client>=1.8.0
215
+
216
+ # MIT:
217
+ arxiv>=2.1.3