Commit 963d0be1 authored by myhloli
Browse files

build(Dockerfile): update model download script and dependencies

- Update the URL for downloading the model setup script in Dockerfile (docs/download_models.py -> scripts/download_models.py)
- Upgrade struct-eqtable to version 0.3.2 and remove pypandoc
- Add new dependencies: einops, accelerate, doclayout_yolo, rapidocr-paddle, and rapid_table
parent fe7b811b
...@@ -42,7 +42,7 @@ RUN /bin/bash -c "wget https://gitee.com/myhloli/MinerU/raw/master/magic-pdf.tem ...@@ -42,7 +42,7 @@ RUN /bin/bash -c "wget https://gitee.com/myhloli/MinerU/raw/master/magic-pdf.tem
# Download models and update the configuration file # Download models and update the configuration file
RUN /bin/bash -c "pip3 install modelscope && \ RUN /bin/bash -c "pip3 install modelscope && \
wget https://gitee.com/myhloli/MinerU/raw/master/docs/download_models.py && \ wget https://gitee.com/myhloli/MinerU/raw/master/scripts/download_models.py && \
python3 download_models.py && \ python3 download_models.py && \
sed -i 's|/tmp/models|/root/.cache/modelscope/hub/opendatalab/PDF-Extract-Kit/models|g' /root/magic-pdf.json && \ sed -i 's|/tmp/models|/root/.cache/modelscope/hub/opendatalab/PDF-Extract-Kit/models|g' /root/magic-pdf.json && \
sed -i 's|cpu|cuda|g' /root/magic-pdf.json" sed -i 's|cpu|cuda|g' /root/magic-pdf.json"
......
...@@ -12,7 +12,11 @@ matplotlib ...@@ -12,7 +12,11 @@ matplotlib
ultralytics ultralytics
paddleocr==2.7.3 paddleocr==2.7.3
paddlepaddle==3.0.0b1 paddlepaddle==3.0.0b1
pypandoc struct-eqtable==0.3.2
struct-eqtable==0.1.0 einops
accelerate
doclayout_yolo==0.0.2
rapidocr-paddle
rapid_table
doclayout-yolo==0.0.2 doclayout-yolo==0.0.2
detectron2 detectron2
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment