mirror of
https://github.com/opendatalab/MinerU.git
synced 2026-03-27 11:08:32 +07:00
- Remove unused functions such as split_long_words, ocr_mk_mm_markdown_with_para, etc. - Simplify ocr_mk_markdown_with_para_core_v2 by removing unnecessary language detection and word splitting logic - Remove wordninja dependency from requirements - Update ocr_model_init to include additional parameters for OCR model configuration
14 lines
389 B
Plaintext
14 lines
389 B
Plaintext
boto3>=1.28.43
|
|
Brotli>=1.1.0
|
|
click>=8.1.7
|
|
fast-langdetect==0.2.0
|
|
loguru>=0.6.0
|
|
numpy>=1.21.6,<2.0.0
|
|
pdfminer.six==20231228
|
|
pydantic>=2.7.2,<2.8.0
|
|
PyMuPDF>=1.24.9
|
|
scikit-learn>=1.0.2
|
|
torch>=2.2.2,<=2.3.1
|
|
transformers
|
|
# This requirements.txt must list only the external dependencies that are strictly necessary. If you need to add a new dependency, please contact the project administrator.
|