mirror of
https://github.com/opendatalab/MinerU.git
synced 2026-03-27 11:08:32 +07:00
- Optimize paragraph splitting algorithm for better text block separation - Update fast-langdetect dependency to ensure compatibility
14 lines
391 B
Plaintext
14 lines
391 B
Plaintext
boto3>=1.28.43
|
|
Brotli>=1.1.0
|
|
click>=8.1.7
|
|
fast-langdetect>=0.2.3,<0.3.0
|
|
loguru>=0.6.0
|
|
numpy>=1.21.6,<2.0.0
|
|
pydantic>=2.7.2
|
|
PyMuPDF>=1.24.9,<=1.24.14
|
|
scikit-learn>=1.0.2
|
|
torch>=2.2.2
|
|
transformers
|
|
pdfminer.six==20231228
|
|
# Keep requirements.txt limited to strictly necessary external dependencies. If you need to add a new dependency, please contact the project administrator.
|