Abhinav Gavireddi committed on
Commit
8c61032
·
1 Parent(s): 33f4e34

fix: fixed issue with package versions

Browse files
Files changed (3) hide show
  1. .gitignore +3 -0
  2. Dockerfile +8 -1
  3. requirements.txt +0 -2
.gitignore CHANGED
@@ -172,3 +172,6 @@ cython_debug/
172
 
173
  # PyPI configuration file
174
  .pypirc
 
 
 
 
172
 
173
  # PyPI configuration file
174
  .pypirc
175
+
176
+ # jupyter notebooks
177
+ *.ipynb
Dockerfile CHANGED
@@ -12,15 +12,22 @@ RUN apt-get update && \
12
  apt-get install -y --no-install-recommends \
13
  build-essential \
14
  ffmpeg \
15
-
16
  # for hnswlib (needed for OpenMP)
17
  libgomp1 \
 
 
18
  && rm -rf /var/lib/apt/lists/*
19
 
20
  # Copy and install Python dependencies
21
  COPY requirements.txt ./
22
  RUN pip install --no-cache-dir -r requirements.txt
23
 
 
 
 
 
 
 
24
  # Copy application code
25
  COPY src/ ./src/
26
  COPY tests/ ./tests/
 
12
  apt-get install -y --no-install-recommends \
13
  build-essential \
14
  ffmpeg \
 
15
  # for hnswlib (needed for OpenMP)
16
  libgomp1 \
17
+ curl \
18
+ git \
19
  && rm -rf /var/lib/apt/lists/*
20
 
21
  # Copy and install Python dependencies
22
  COPY requirements.txt ./
23
  RUN pip install --no-cache-dir -r requirements.txt
24
 
25
+ # Install/patch MinerU and download models
26
+ RUN pip uninstall -y magic-pdf && \
27
+ pip install git+https://github.com/opendatalab/MinerU.git@dev && \
28
+ curl -L https://github.com/opendatalab/MinerU/raw/dev/scripts/download_models_hf.py -o download_models_hf.py && \
29
+ python download_models_hf.py
30
+
31
  # Copy application code
32
  COPY src/ ./src/
33
  COPY tests/ ./tests/
requirements.txt CHANGED
@@ -1,9 +1,7 @@
1
  # Core
2
  streamlit>=1.25.0
3
- mineru>=0.1.0
4
  sentence-transformers>=2.2.2
5
  rank-bm25>=0.2.2
6
- redis>=4.5.1
7
  hnswlib>=0.7.0
8
  transformers>=4.29.2
9
  torch>=2.0.0
 
1
  # Core
2
  streamlit>=1.25.0
 
3
  sentence-transformers>=2.2.2
4
  rank-bm25>=0.2.2
 
5
  hnswlib>=0.7.0
6
  transformers>=4.29.2
7
  torch>=2.0.0