mirror of
https://github.com/opendatalab/MinerU.git
synced 2026-03-27 11:08:32 +07:00
Commit Graph
Select branches
Hide Pull Requests
add_docx
cla
copilot/analyze-issue-4433
dev
gh-pages
master
realese-0.8.0
release-0.10.0
release-0.10.1
release-0.10.2
release-0.10.3
release-0.10.4
release-0.10.5
release-0.10.6
release-0.9.0
release-0.9.1
release-0.9.2
release-0.9.3
release-1.0.0
release-1.1.0
release-1.2.0
release-1.2.1
release-1.2.2
release-1.3.0
release-1.3.1
release-1.3.10
release-1.3.11
release-1.3.12
release-1.3.2
release-1.3.3
release-1.3.4
release-1.3.5
release-1.3.6
release-1.3.7
release-1.3.8
release-1.3.9
release-2.0.0
release-2.0.1
release-2.0.2
release-2.0.3
release-2.0.4
release-2.0.5
release-2.0.6
release-2.1.0
release-2.1.1
release-2.1.10
release-2.1.2
release-2.1.3
release-2.1.4
release-2.1.5
release-2.1.6
release-2.1.7
release-2.1.8
release-2.1.9
release-2.2.0
release-2.2.1
release-2.2.2
release-2.5.0
release-2.5.1
release-2.5.2
release-2.5.3
release-2.5.4
release-2.6.0
release-2.6.1
release-2.6.2
release-2.6.3
release-2.6.4
release-2.6.5
release-2.6.6
release-2.6.7
release-2.7.0
release-2.7.1
release-2.7.2
release-2.7.3
release-2.7.4
release-2.7.6
#1
#10
#100
#1001
#1006
#101
#1010
#1011
#1012
#1013
#1016
#1018
#102
#1024
#1027
#103
#1036
#104
#1045
#1046
#1047
#1048
#1049
#105
#1050
#1052
#1053
#1054
#1056
#1058
#1059
#106
#1060
#1061
#1062
#1063
#1064
#1065
#1066
#107
#1071
#1074
#1075
#1076
#1077
#108
#1082
#1086
#1088
#1089
#1094
#1095
#1098
#1099
#11
#110
#1100
#1101
#1102
#1104
#1105
#1106
#111
#1110
#1112
#1113
#1116
#1117
#1119
#112
#1120
#1121
#113
#1130
#1132
#1134
#1135
#1136
#1137
#1138
#1139
#114
#1140
#1141
#1143
#1147
#115
#1152
#1153
#1154
#1156
#116
#1164
#1165
#1166
#1167
#117
#1170
#1177
#1178
#118
#119
#1193
#1198
#12
#120
#1201
#1207
#1208
#1209
#1211
#1212
#1213
#1214
#1215
#1216
#1218
#1222
#1224
#1228
#1231
#1232
#1238
#1239
#1243
#1247
#1252
#1255
#1256
#1257
#1258
#1259
#1260
#1261
#1262
#1263
#1264
#1265
#1266
#1267
#1268
#1272
#1275
#1276
#1277
#1278
#1280
#1281
#1284
#1289
#1291
#1292
#1299
#1299
#13
#130
#1301
#1304
#131
#1311
#1312
#1313
#1318
#132
#1321
#1322
#1323
#1325
#1328
#1329
#133
#1330
#1336
#1337
#1338
#1352
#1362
#1365
#1370
#1379
#138
#1380
#1386
#139
#1397
#1398
#14
#140
#141
#1412
#1414
#1419
#1420
#1421
#1422
#1423
#1424
#1425
#1426
#1427
#1428
#1429
#1430
#1431
#1436
#1437
#1438
#1439
#1440
#1448
#1449
#1450
#1451
#1452
#1453
#1454
#1459
#1460
#1462
#1464
#1465
#1468
#1469
#1470
#1471
#1472
#1473
#1474
#1475
#1476
#1477
#1479
#1481
#1482
#1483
#1484
#1486
#1487
#1490
#1492
#1493
#1494
#1495
#1496
#1497
#1498
#1499
#15
#1500
#1510
#1511
#1512
#1513
#1515
#1516
#1517
#1520
#1521
#1531
#1532
#1533
#1534
#1535
#1537
#1538
#1542
#1543
#1546
#1547
#1549
#1550
#1551
#1553
#1554
#1556
#1557
#1565
#1567
#1569
#1570
#1571
#1578
#1580
#1582
#1588
#1590
#1591
#1592
#1593
#1594
#1595
#16
#160
#1601
#1602
#1606
#1607
#1612
#1613
#1614
#1616
#1617
#1618
#1619
#1621
#1622
#1631
#1636
#1648
#1661
#1664
#1672
#168
#1682
#1683
#1689
#169
#1693
#17
#1701
#1703
#1704
#171
#1711
#172
#1734
#1737
#1738
#1743
#1748
#1750
#1753
#1757
#1759
#1760
#1761
#1762
#1767
#1769
#1770
#1771
#1776
#1777
#1778
#1785
#1787
#1788
#1789
#1790
#1792
#1793
#1799
#18
#1810
#1810
#1821
#1822
#1823
#1824
#1825
#1827
#1828
#1829
#1838
#1839
#1841
#1863
#1883
#189
#1894
#1897
#19
#1906
#1910
#1919
#1944
#1948
#1950
#1955
#1956
#1957
#1958
#1959
#1970
#1974
#1975
#1980
#1981
#1982
#1984
#1985
#1986
#2
#20
#2003
#2004
#2010
#2062
#2063
#2064
#2065
#2066
#2069
#2070
#2071
#2072
#2073
#2074
#2077
#2078
#2079
#2080
#2081
#2082
#2083
#2084
#2086
#2087
#2088
#2089
#2090
#2091
#2092
#2093
#21
#2114
#2115
#2124
#2125
#2126
#2128
#214
#2142
#2144
#2145
#2146
#2147
#2148
#215
#2151
#2152
#2153
#2154
#2155
#2156
#2157
#2166
#2170
#2172
#2173
#2174
#2177
#2178
#2189
#2193
#2194
#2195
#2196
#2197
#2198
#2199
#22
#2201
#2205
#2206
#2207
#2208
#2214
#2215
#2217
#2220
#2223
#2224
#2225
#2226
#2227
#2231
#2232
#2234
#2239
#2240
#2250
#2251
#2252
#2253
#2254
#2255
#2256
#2264
#2265
#2266
#2267
#2269
#2273
#2274
#2297
#2298
#23
#231
#2311
#2314
#2315
#2316
#2352
#2353
#2354
#2355
#2356
#2365
#2367
#2380
#2381
#2382
#2383
#2384
#2385
#2386
#2387
#2388
#2389
#2395
#24
#2402
#2403
#2404
#2405
#2406
#2410
#2411
#2423
#2429
#2437
#2440
#2446
#2449
#2450
#2451
#2464
#2465
#2466
#2467
#2468
#2487
#25
#2501
#2505
#2506
#2510
#2511
#2512
#2513
#2514
#2519
#2526
#2526
#2536
#2550
#2562
#2566
#2570
#2571
#2575
#2578
#258
#2591
#26
#2609
#2611
#2613
#2614
#2616
#2620
#2622
#2623
#2624
#2625
#2626
#2627
#2628
#2629
#2630
#2631
#2632
#2633
#2634
#2635
#2636
#2638
#2639
#264
#2644
#2645
#2646
#2648
#2649
#2650
#2652
#2653
#2654
#2655
#2656
#2659
#2660
#2667
#2668
#2675
#2676
#2679
#2680
#2681
#2686
#2688
#2691
#2695
#2696
#2698
#27
#2703
#2704
#2705
#2706
#2707
#2719
#2721
#2722
#2727
#2729
#2733
#2736
#2740
#2742
#2751
#2752
#2753
#2754
#2755
#2756
#2757
#2758
#2763
#2767
#2768
#2777
#2780
#2783
#2787
#2788
#2789
#2790
#28
#2813
#2814
#2815
#2824
#2825
#2826
#2831
#2833
#2834
#2836
#2837
#284
#2840
#2842
#2843
#2844
#2845
#2850
#2852
#2854
#2857
#2858
#2859
#286
#2861
#2870
#2873
#2878
#2879
#2881
#2887
#2889
#2890
#2891
#2892
#2893
#2894
#2895
#2896
#2897
#2898
#2899
#29
#2900
#2901
#2903
#2904
#2905
#2906
#2907
#2908
#291
#2914
#2923
#2931
#2932
#2937
#2940
#2941
#2943
#2948
#2975
#2989
#2990
#3
#30
#3016
#3017
#3018
#3019
#3020
#3023
#3024
#3026
#3028
#3029
#3030
#3032
#3033
#3034
#3035
#3036
#3037
#3038
#3039
#3040
#3041
#3042
#3043
#3044
#3045
#3046
#3048
#3052
#3053
#3054
#3056
#3057
#306
#3060
#3061
#3062
#3063
#3064
#3065
#3067
#3068
#3069
#3070
#3071
#3072
#3073
#3074
#3075
#3076
#3077
#3091
#3093
#3095
#3096
#3099
#31
#3100
#3105
#3124
#3125
#3126
#3128
#3129
#3137
#3138
#3139
#314
#3140
#3141
#3143
#3144
#3145
#3149
#3150
#3151
#3154
#3155
#3156
#3158
#3167
#3172
#3173
#3174
#3175
#3181
#3182
#3183
#3184
#3186
#3187
#3189
#3190
#3196
#3197
#3198
#32
#3201
#3213
#3214
#3218
#3222
#3224
#3228
#3229
#3237
#3239
#3240
#3241
#3242
#3269
#3275
#3277
#3281
#329
#3291
#33
#3314
#3315
#3321
#3324
#3325
#3335
#3336
#3339
#3340
#3354
#3361
#3365
#3371
#3372
#3374
#3382
#3383
#3384
#3388
#3396
#3397
#34
#3405
#3406
#3407
#3419
#3420
#3421
#3423
#3424
#3425
#3426
#3427
#3428
#3429
#3435
#3437
#3438
#3442
#3448
#3449
#3450
#3451
#3473
#3477
#3489
#3490
#3498
#3499
#35
#350
#3501
#3502
#3503
#3504
#3505
#3506
#3507
#3508
#3509
#3510
#3511
#3512
#3513
#3514
#3515
#3516
#3517
#3523
#3527
#3529
#3532
#3533
#3534
#3535
#354
#3544
#3545
#3546
#3549
#355
#3550
#3551
#3552
#3553
#3554
#3555
#3556
#3557
#3558
#3563
#36
#3606
#3607
#3608
#3609
#3610
#3615
#3619
#3630
#3635
#3649
#3650
#3651
#3671
#3672
#3688
#3697
#3698
#3699
#37
#3700
#3701
#3703
#3706
#3706
#3707
#3708
#3709
#371
#3711
#3722
#3723
#3737
#3739
#374
#3740
#3742
#3748
#3750
#3752
#3754
#3755
#3756
#3760
#3761
#3762
#3766
#3767
#3768
#3769
#3770
#3779
#379
#38
#3803
#3804
#3805
#3806
#3812
#3814
#3819
#3820
#3821
#3822
#3823
#3824
#3825
#3828
#3829
#3830
#3831
#3833
#3834
#3835
#3836
#3837
#3841
#3842
#3851
#3854
#3855
#386
#3860
#3870
#3873
#3880
#3886
#3887
#3888
#3891
#3892
#3895
#3897
#3898
#3899
#39
#3900
#3902
#3903
#3904
#3905
#3918
#3919
#3931
#3932
#3933
#3934
#3946
#3950
#396
#3963
#3964
#3966
#3967
#397
#3972
#3974
#3975
#3976
#398
#3980
#3990
#3995
#3997
#4
#40
#400
#401
#404
#4040
#4046
#4062
#4063
#4065
#4066
#4067
#4068
#4069
#4070
#4073
#4074
#4076
#4077
#4078
#4081
#4082
#4083
#409
#4096
#4098
#4099
#41
#410
#4100
#4101
#4102
#4103
#4104
#4105
#4106
#4112
#4114
#4115
#4133
#4137
#4140
#4141
#4144
#417
#417
#4170
#4171
#4172
#4175
#4176
#4177
#4178
#4179
#418
#4192
#4193
#4194
#4196
#42
#4231
#4239
#4241
#4244
#4267
#4268
#4270
#4271
#4272
#4273
#4277
#4283
#4284
#4285
#4286
#4287
#4292
#4293
#4299
#43
#4301
#4303
#4304
#4305
#4306
#4308
#4309
#4310
#4318
#4330
#4349
#4353
#4357
#4358
#4359
#4365
#4367
#4368
#4386
#4388
#44
#4403
#4404
#4405
#4406
#4407
#4408
#4409
#4410
#4411
#4417
#4418
#4419
#4420
#4421
#4430
#4432
#4434
#4435
#4438
#4446
#4448
#4450
#4451
#4452
#4453
#4454
#4455
#4456
#4457
#4458
#4459
#4468
#447
#4471
#4473
#4474
#4475
#448
#4498
#4499
#45
#4500
#4503
#4504
#4505
#4507
#4508
#4513
#4518
#4523
#4525
#4526
#4544
#4555
#4559
#4560
#4564
#4569
#4575
#458
#4584
#4586
#4592
#4593
#4595
#4596
#46
#4622
#4626
#463
#4631
#4635
#4636
#4637
#4638
#4641
#4644
#4645
#4651
#4652
#4654
#4658
#4660
#4662
#4663
#4665
#467
#47
#471
#478
#48
#486
#487
#488
#489
#49
#493
#494
#495
#496
#499
#5
#50
#500
#501
#503
#507
#508
#51
#510
#511
#512
#518
#52
#521
#523
#526
#527
#528
#529
#53
#532
#533
#534
#536
#54
#542
#544
#547
#55
#552
#554
#555
#56
#560
#564
#567
#568
#57
#573
#574
#577
#578
#579
#58
#580
#581
#582
#584
#586
#587
#588
#59
#597
#599
#6
#60
#601
#602
#603
#604
#607
#608
#61
#616
#62
#63
#630
#631
#635
#636
#639
#64
#645
#65
#652
#66
#661
#668
#669
#67
#670
#672
#673
#676
#68
#682
#687
#689
#689
#69
#690
#693
#694
#695
#696
#698
#699
#7
#70
#700
#701
#706
#707
#71
#710
#716
#717
#718
#72
#73
#737
#74
#740
#743
#744
#745
#747
#75
#753
#76
#765
#766
#769
#77
#773
#774
#776
#777
#78
#782
#784
#785
#786
#788
#789
#79
#791
#793
#794
#797
#798
#799
#8
#80
#800
#802
#804
#805
#806
#808
#809
#81
#810
#817
#818
#82
#820
#824
#825
#83
#830
#831
#833
#834
#835
#838
#839
#84
#841
#843
#844
#845
#847
#85
#853
#854
#855
#856
#857
#858
#86
#860
#866
#867
#869
#87
#871
#874
#875
#876
#877
#878
#879
#88
#880
#882
#883
#884
#885
#886
#887
#888
#889
#89
#898
#9
#90
#902
#906
#907
#91
#910
#911
#912
#913
#914
#915
#916
#917
#918
#919
#92
#920
#921
#922
#923
#924
#925
#927
#928
#929
#93
#931
#938
#94
#941
#943
#945
#948
#95
#951
#957
#96
#964
#965
#966
#967
#968
#969
#97
#971
#973
#974
#975
#976
#977
#98
#986
#99
#998
magic_pdf-0.1.0-released
magic_pdf-0.1.1-released
magic_pdf-0.1.2-released
magic_pdf-0.1.3-released
magic_pdf-0.1.4-released
magic_pdf-0.10.0-released
magic_pdf-0.10.1-released
magic_pdf-0.10.2-released
magic_pdf-0.10.3-released
magic_pdf-0.10.4-released
magic_pdf-0.10.5-released
magic_pdf-0.10.6-released
magic_pdf-0.2.0-released
magic_pdf-0.2.1-released
magic_pdf-0.3.0-released
magic_pdf-0.3.1-released
magic_pdf-0.3.10-released
magic_pdf-0.3.11-released
magic_pdf-0.3.12-released
magic_pdf-0.3.13-released
magic_pdf-0.3.14-released
magic_pdf-0.3.15-released
magic_pdf-0.3.16-released
magic_pdf-0.3.17-released
magic_pdf-0.3.18-released
magic_pdf-0.3.19-released
magic_pdf-0.3.2-released
magic_pdf-0.3.20-released
magic_pdf-0.3.21-released
magic_pdf-0.3.22-released
magic_pdf-0.3.23-released
magic_pdf-0.3.24-released
magic_pdf-0.3.25-released
magic_pdf-0.3.26-released
magic_pdf-0.3.27-released
magic_pdf-0.3.28-released
magic_pdf-0.3.29-released
magic_pdf-0.3.3-released
magic_pdf-0.3.30-released
magic_pdf-0.3.31-released
magic_pdf-0.3.32-released
magic_pdf-0.3.33-released
magic_pdf-0.3.34-released
magic_pdf-0.3.35-released
magic_pdf-0.3.36-released
magic_pdf-0.3.37-released
magic_pdf-0.3.4-released
magic_pdf-0.3.5-released
magic_pdf-0.3.6-released
magic_pdf-0.3.7-released
magic_pdf-0.3.8-released
magic_pdf-0.3.9-released
magic_pdf-0.4.0-released
magic_pdf-0.4.1-released
magic_pdf-0.4.10-released
magic_pdf-0.4.11-released
magic_pdf-0.4.12-released
magic_pdf-0.4.13-released
magic_pdf-0.4.14-released
magic_pdf-0.4.15-released
magic_pdf-0.4.16-released
magic_pdf-0.4.17-released
magic_pdf-0.4.18-released
magic_pdf-0.4.19-released
magic_pdf-0.4.2-released
magic_pdf-0.4.20-released
magic_pdf-0.4.21-released
magic_pdf-0.4.22-released
magic_pdf-0.4.23-released
magic_pdf-0.4.24-released
magic_pdf-0.4.25-released
magic_pdf-0.4.26-released
magic_pdf-0.4.27-released
magic_pdf-0.4.28-released
magic_pdf-0.4.3-released
magic_pdf-0.4.5-released
magic_pdf-0.4.6-released
magic_pdf-0.4.7-released
magic_pdf-0.4.8-released
magic_pdf-0.4.9-released
magic_pdf-0.5.0-released
magic_pdf-0.5.1-released
magic_pdf-0.5.10-released
magic_pdf-0.5.11-released
magic_pdf-0.5.12-released
magic_pdf-0.5.13-released
magic_pdf-0.5.2-released
magic_pdf-0.5.3-released
magic_pdf-0.5.4-released
magic_pdf-0.5.5-released
magic_pdf-0.5.6-released
magic_pdf-0.5.7-released
magic_pdf-0.5.8-released
magic_pdf-0.5.9-released
magic_pdf-0.6.0-released
magic_pdf-0.6.1-released
magic_pdf-0.6.2b1-released
magic_pdf-0.7.0a1-released
magic_pdf-0.7.0b1-released
magic_pdf-0.7.1-released
magic_pdf-0.8.0-released
magic_pdf-0.8.1-released
magic_pdf-0.8.1-update-docs
magic_pdf-0.9.0-released
magic_pdf-0.9.1-released
magic_pdf-0.9.2-released
magic_pdf-0.9.3-released
magic_pdf-1.0.0-released
magic_pdf-1.0.1-released
magic_pdf-1.1.0-released
magic_pdf-1.2.0-released
magic_pdf-1.2.1-released
magic_pdf-1.2.2-released
magic_pdf-1.3.0-released
magic_pdf-1.3.1-released
magic_pdf-1.3.10-released
magic_pdf-1.3.11-released
magic_pdf-1.3.12-released
magic_pdf-1.3.2-released
magic_pdf-1.3.3-released
magic_pdf-1.3.4-released
magic_pdf-1.3.5-released
magic_pdf-1.3.6-released
magic_pdf-1.3.7-released
magic_pdf-1.3.8-released
magic_pdf-1.3.9-released
mineru-2.0.0-released
mineru-2.0.1-released
mineru-2.0.2-released
mineru-2.0.3-released
mineru-2.0.4-released
mineru-2.0.5-released
mineru-2.0.6-released
mineru-2.1.0-released
mineru-2.1.1-released
mineru-2.1.10-released
mineru-2.1.11-released
mineru-2.1.2-released
mineru-2.1.3-released
mineru-2.1.4-released
mineru-2.1.5-released
mineru-2.1.6-released
mineru-2.1.7-released
mineru-2.1.8-released
mineru-2.1.9-released
mineru-2.2.0-released
mineru-2.2.1-released
mineru-2.2.2-released
mineru-2.5.0-released
mineru-2.5.1-released
mineru-2.5.2-released
mineru-2.5.3-released
mineru-2.5.4-released
mineru-2.6.0-released
mineru-2.6.1-released
mineru-2.6.2-released
mineru-2.6.3-released
mineru-2.6.4-released
mineru-2.6.5-released
mineru-2.6.6-released
mineru-2.6.7-released
mineru-2.6.8-released
mineru-2.7.0-released
mineru-2.7.1-released
mineru-2.7.2-released
mineru-2.7.3-released
mineru-2.7.4-released
mineru-2.7.5-released
mineru-2.7.6-released
Select branches
Hide Pull Requests
add_docx
cla
copilot/analyze-issue-4433
dev
gh-pages
master
realese-0.8.0
release-0.10.0
release-0.10.1
release-0.10.2
release-0.10.3
release-0.10.4
release-0.10.5
release-0.10.6
release-0.9.0
release-0.9.1
release-0.9.2
release-0.9.3
release-1.0.0
release-1.1.0
release-1.2.0
release-1.2.1
release-1.2.2
release-1.3.0
release-1.3.1
release-1.3.10
release-1.3.11
release-1.3.12
release-1.3.2
release-1.3.3
release-1.3.4
release-1.3.5
release-1.3.6
release-1.3.7
release-1.3.8
release-1.3.9
release-2.0.0
release-2.0.1
release-2.0.2
release-2.0.3
release-2.0.4
release-2.0.5
release-2.0.6
release-2.1.0
release-2.1.1
release-2.1.10
release-2.1.2
release-2.1.3
release-2.1.4
release-2.1.5
release-2.1.6
release-2.1.7
release-2.1.8
release-2.1.9
release-2.2.0
release-2.2.1
release-2.2.2
release-2.5.0
release-2.5.1
release-2.5.2
release-2.5.3
release-2.5.4
release-2.6.0
release-2.6.1
release-2.6.2
release-2.6.3
release-2.6.4
release-2.6.5
release-2.6.6
release-2.6.7
release-2.7.0
release-2.7.1
release-2.7.2
release-2.7.3
release-2.7.4
release-2.7.6
#1
#10
#100
#1001
#1006
#101
#1010
#1011
#1012
#1013
#1016
#1018
#102
#1024
#1027
#103
#1036
#104
#1045
#1046
#1047
#1048
#1049
#105
#1050
#1052
#1053
#1054
#1056
#1058
#1059
#106
#1060
#1061
#1062
#1063
#1064
#1065
#1066
#107
#1071
#1074
#1075
#1076
#1077
#108
#1082
#1086
#1088
#1089
#1094
#1095
#1098
#1099
#11
#110
#1100
#1101
#1102
#1104
#1105
#1106
#111
#1110
#1112
#1113
#1116
#1117
#1119
#112
#1120
#1121
#113
#1130
#1132
#1134
#1135
#1136
#1137
#1138
#1139
#114
#1140
#1141
#1143
#1147
#115
#1152
#1153
#1154
#1156
#116
#1164
#1165
#1166
#1167
#117
#1170
#1177
#1178
#118
#119
#1193
#1198
#12
#120
#1201
#1207
#1208
#1209
#1211
#1212
#1213
#1214
#1215
#1216
#1218
#1222
#1224
#1228
#1231
#1232
#1238
#1239
#1243
#1247
#1252
#1255
#1256
#1257
#1258
#1259
#1260
#1261
#1262
#1263
#1264
#1265
#1266
#1267
#1268
#1272
#1275
#1276
#1277
#1278
#1280
#1281
#1284
#1289
#1291
#1292
#1299
#1299
#13
#130
#1301
#1304
#131
#1311
#1312
#1313
#1318
#132
#1321
#1322
#1323
#1325
#1328
#1329
#133
#1330
#1336
#1337
#1338
#1352
#1362
#1365
#1370
#1379
#138
#1380
#1386
#139
#1397
#1398
#14
#140
#141
#1412
#1414
#1419
#1420
#1421
#1422
#1423
#1424
#1425
#1426
#1427
#1428
#1429
#1430
#1431
#1436
#1437
#1438
#1439
#1440
#1448
#1449
#1450
#1451
#1452
#1453
#1454
#1459
#1460
#1462
#1464
#1465
#1468
#1469
#1470
#1471
#1472
#1473
#1474
#1475
#1476
#1477
#1479
#1481
#1482
#1483
#1484
#1486
#1487
#1490
#1492
#1493
#1494
#1495
#1496
#1497
#1498
#1499
#15
#1500
#1510
#1511
#1512
#1513
#1515
#1516
#1517
#1520
#1521
#1531
#1532
#1533
#1534
#1535
#1537
#1538
#1542
#1543
#1546
#1547
#1549
#1550
#1551
#1553
#1554
#1556
#1557
#1565
#1567
#1569
#1570
#1571
#1578
#1580
#1582
#1588
#1590
#1591
#1592
#1593
#1594
#1595
#16
#160
#1601
#1602
#1606
#1607
#1612
#1613
#1614
#1616
#1617
#1618
#1619
#1621
#1622
#1631
#1636
#1648
#1661
#1664
#1672
#168
#1682
#1683
#1689
#169
#1693
#17
#1701
#1703
#1704
#171
#1711
#172
#1734
#1737
#1738
#1743
#1748
#1750
#1753
#1757
#1759
#1760
#1761
#1762
#1767
#1769
#1770
#1771
#1776
#1777
#1778
#1785
#1787
#1788
#1789
#1790
#1792
#1793
#1799
#18
#1810
#1810
#1821
#1822
#1823
#1824
#1825
#1827
#1828
#1829
#1838
#1839
#1841
#1863
#1883
#189
#1894
#1897
#19
#1906
#1910
#1919
#1944
#1948
#1950
#1955
#1956
#1957
#1958
#1959
#1970
#1974
#1975
#1980
#1981
#1982
#1984
#1985
#1986
#2
#20
#2003
#2004
#2010
#2062
#2063
#2064
#2065
#2066
#2069
#2070
#2071
#2072
#2073
#2074
#2077
#2078
#2079
#2080
#2081
#2082
#2083
#2084
#2086
#2087
#2088
#2089
#2090
#2091
#2092
#2093
#21
#2114
#2115
#2124
#2125
#2126
#2128
#214
#2142
#2144
#2145
#2146
#2147
#2148
#215
#2151
#2152
#2153
#2154
#2155
#2156
#2157
#2166
#2170
#2172
#2173
#2174
#2177
#2178
#2189
#2193
#2194
#2195
#2196
#2197
#2198
#2199
#22
#2201
#2205
#2206
#2207
#2208
#2214
#2215
#2217
#2220
#2223
#2224
#2225
#2226
#2227
#2231
#2232
#2234
#2239
#2240
#2250
#2251
#2252
#2253
#2254
#2255
#2256
#2264
#2265
#2266
#2267
#2269
#2273
#2274
#2297
#2298
#23
#231
#2311
#2314
#2315
#2316
#2352
#2353
#2354
#2355
#2356
#2365
#2367
#2380
#2381
#2382
#2383
#2384
#2385
#2386
#2387
#2388
#2389
#2395
#24
#2402
#2403
#2404
#2405
#2406
#2410
#2411
#2423
#2429
#2437
#2440
#2446
#2449
#2450
#2451
#2464
#2465
#2466
#2467
#2468
#2487
#25
#2501
#2505
#2506
#2510
#2511
#2512
#2513
#2514
#2519
#2526
#2526
#2536
#2550
#2562
#2566
#2570
#2571
#2575
#2578
#258
#2591
#26
#2609
#2611
#2613
#2614
#2616
#2620
#2622
#2623
#2624
#2625
#2626
#2627
#2628
#2629
#2630
#2631
#2632
#2633
#2634
#2635
#2636
#2638
#2639
#264
#2644
#2645
#2646
#2648
#2649
#2650
#2652
#2653
#2654
#2655
#2656
#2659
#2660
#2667
#2668
#2675
#2676
#2679
#2680
#2681
#2686
#2688
#2691
#2695
#2696
#2698
#27
#2703
#2704
#2705
#2706
#2707
#2719
#2721
#2722
#2727
#2729
#2733
#2736
#2740
#2742
#2751
#2752
#2753
#2754
#2755
#2756
#2757
#2758
#2763
#2767
#2768
#2777
#2780
#2783
#2787
#2788
#2789
#2790
#28
#2813
#2814
#2815
#2824
#2825
#2826
#2831
#2833
#2834
#2836
#2837
#284
#2840
#2842
#2843
#2844
#2845
#2850
#2852
#2854
#2857
#2858
#2859
#286
#2861
#2870
#2873
#2878
#2879
#2881
#2887
#2889
#2890
#2891
#2892
#2893
#2894
#2895
#2896
#2897
#2898
#2899
#29
#2900
#2901
#2903
#2904
#2905
#2906
#2907
#2908
#291
#2914
#2923
#2931
#2932
#2937
#2940
#2941
#2943
#2948
#2975
#2989
#2990
#3
#30
#3016
#3017
#3018
#3019
#3020
#3023
#3024
#3026
#3028
#3029
#3030
#3032
#3033
#3034
#3035
#3036
#3037
#3038
#3039
#3040
#3041
#3042
#3043
#3044
#3045
#3046
#3048
#3052
#3053
#3054
#3056
#3057
#306
#3060
#3061
#3062
#3063
#3064
#3065
#3067
#3068
#3069
#3070
#3071
#3072
#3073
#3074
#3075
#3076
#3077
#3091
#3093
#3095
#3096
#3099
#31
#3100
#3105
#3124
#3125
#3126
#3128
#3129
#3137
#3138
#3139
#314
#3140
#3141
#3143
#3144
#3145
#3149
#3150
#3151
#3154
#3155
#3156
#3158
#3167
#3172
#3173
#3174
#3175
#3181
#3182
#3183
#3184
#3186
#3187
#3189
#3190
#3196
#3197
#3198
#32
#3201
#3213
#3214
#3218
#3222
#3224
#3228
#3229
#3237
#3239
#3240
#3241
#3242
#3269
#3275
#3277
#3281
#329
#3291
#33
#3314
#3315
#3321
#3324
#3325
#3335
#3336
#3339
#3340
#3354
#3361
#3365
#3371
#3372
#3374
#3382
#3383
#3384
#3388
#3396
#3397
#34
#3405
#3406
#3407
#3419
#3420
#3421
#3423
#3424
#3425
#3426
#3427
#3428
#3429
#3435
#3437
#3438
#3442
#3448
#3449
#3450
#3451
#3473
#3477
#3489
#3490
#3498
#3499
#35
#350
#3501
#3502
#3503
#3504
#3505
#3506
#3507
#3508
#3509
#3510
#3511
#3512
#3513
#3514
#3515
#3516
#3517
#3523
#3527
#3529
#3532
#3533
#3534
#3535
#354
#3544
#3545
#3546
#3549
#355
#3550
#3551
#3552
#3553
#3554
#3555
#3556
#3557
#3558
#3563
#36
#3606
#3607
#3608
#3609
#3610
#3615
#3619
#3630
#3635
#3649
#3650
#3651
#3671
#3672
#3688
#3697
#3698
#3699
#37
#3700
#3701
#3703
#3706
#3706
#3707
#3708
#3709
#371
#3711
#3722
#3723
#3737
#3739
#374
#3740
#3742
#3748
#3750
#3752
#3754
#3755
#3756
#3760
#3761
#3762
#3766
#3767
#3768
#3769
#3770
#3779
#379
#38
#3803
#3804
#3805
#3806
#3812
#3814
#3819
#3820
#3821
#3822
#3823
#3824
#3825
#3828
#3829
#3830
#3831
#3833
#3834
#3835
#3836
#3837
#3841
#3842
#3851
#3854
#3855
#386
#3860
#3870
#3873
#3880
#3886
#3887
#3888
#3891
#3892
#3895
#3897
#3898
#3899
#39
#3900
#3902
#3903
#3904
#3905
#3918
#3919
#3931
#3932
#3933
#3934
#3946
#3950
#396
#3963
#3964
#3966
#3967
#397
#3972
#3974
#3975
#3976
#398
#3980
#3990
#3995
#3997
#4
#40
#400
#401
#404
#4040
#4046
#4062
#4063
#4065
#4066
#4067
#4068
#4069
#4070
#4073
#4074
#4076
#4077
#4078
#4081
#4082
#4083
#409
#4096
#4098
#4099
#41
#410
#4100
#4101
#4102
#4103
#4104
#4105
#4106
#4112
#4114
#4115
#4133
#4137
#4140
#4141
#4144
#417
#417
#4170
#4171
#4172
#4175
#4176
#4177
#4178
#4179
#418
#4192
#4193
#4194
#4196
#42
#4231
#4239
#4241
#4244
#4267
#4268
#4270
#4271
#4272
#4273
#4277
#4283
#4284
#4285
#4286
#4287
#4292
#4293
#4299
#43
#4301
#4303
#4304
#4305
#4306
#4308
#4309
#4310
#4318
#4330
#4349
#4353
#4357
#4358
#4359
#4365
#4367
#4368
#4386
#4388
#44
#4403
#4404
#4405
#4406
#4407
#4408
#4409
#4410
#4411
#4417
#4418
#4419
#4420
#4421
#4430
#4432
#4434
#4435
#4438
#4446
#4448
#4450
#4451
#4452
#4453
#4454
#4455
#4456
#4457
#4458
#4459
#4468
#447
#4471
#4473
#4474
#4475
#448
#4498
#4499
#45
#4500
#4503
#4504
#4505
#4507
#4508
#4513
#4518
#4523
#4525
#4526
#4544
#4555
#4559
#4560
#4564
#4569
#4575
#458
#4584
#4586
#4592
#4593
#4595
#4596
#46
#4622
#4626
#463
#4631
#4635
#4636
#4637
#4638
#4641
#4644
#4645
#4651
#4652
#4654
#4658
#4660
#4662
#4663
#4665
#467
#47
#471
#478
#48
#486
#487
#488
#489
#49
#493
#494
#495
#496
#499
#5
#50
#500
#501
#503
#507
#508
#51
#510
#511
#512
#518
#52
#521
#523
#526
#527
#528
#529
#53
#532
#533
#534
#536
#54
#542
#544
#547
#55
#552
#554
#555
#56
#560
#564
#567
#568
#57
#573
#574
#577
#578
#579
#58
#580
#581
#582
#584
#586
#587
#588
#59
#597
#599
#6
#60
#601
#602
#603
#604
#607
#608
#61
#616
#62
#63
#630
#631
#635
#636
#639
#64
#645
#65
#652
#66
#661
#668
#669
#67
#670
#672
#673
#676
#68
#682
#687
#689
#689
#69
#690
#693
#694
#695
#696
#698
#699
#7
#70
#700
#701
#706
#707
#71
#710
#716
#717
#718
#72
#73
#737
#74
#740
#743
#744
#745
#747
#75
#753
#76
#765
#766
#769
#77
#773
#774
#776
#777
#78
#782
#784
#785
#786
#788
#789
#79
#791
#793
#794
#797
#798
#799
#8
#80
#800
#802
#804
#805
#806
#808
#809
#81
#810
#817
#818
#82
#820
#824
#825
#83
#830
#831
#833
#834
#835
#838
#839
#84
#841
#843
#844
#845
#847
#85
#853
#854
#855
#856
#857
#858
#86
#860
#866
#867
#869
#87
#871
#874
#875
#876
#877
#878
#879
#88
#880
#882
#883
#884
#885
#886
#887
#888
#889
#89
#898
#9
#90
#902
#906
#907
#91
#910
#911
#912
#913
#914
#915
#916
#917
#918
#919
#92
#920
#921
#922
#923
#924
#925
#927
#928
#929
#93
#931
#938
#94
#941
#943
#945
#948
#95
#951
#957
#96
#964
#965
#966
#967
#968
#969
#97
#971
#973
#974
#975
#976
#977
#98
#986
#99
#998
magic_pdf-0.1.0-released
magic_pdf-0.1.1-released
magic_pdf-0.1.2-released
magic_pdf-0.1.3-released
magic_pdf-0.1.4-released
magic_pdf-0.10.0-released
magic_pdf-0.10.1-released
magic_pdf-0.10.2-released
magic_pdf-0.10.3-released
magic_pdf-0.10.4-released
magic_pdf-0.10.5-released
magic_pdf-0.10.6-released
magic_pdf-0.2.0-released
magic_pdf-0.2.1-released
magic_pdf-0.3.0-released
magic_pdf-0.3.1-released
magic_pdf-0.3.10-released
magic_pdf-0.3.11-released
magic_pdf-0.3.12-released
magic_pdf-0.3.13-released
magic_pdf-0.3.14-released
magic_pdf-0.3.15-released
magic_pdf-0.3.16-released
magic_pdf-0.3.17-released
magic_pdf-0.3.18-released
magic_pdf-0.3.19-released
magic_pdf-0.3.2-released
magic_pdf-0.3.20-released
magic_pdf-0.3.21-released
magic_pdf-0.3.22-released
magic_pdf-0.3.23-released
magic_pdf-0.3.24-released
magic_pdf-0.3.25-released
magic_pdf-0.3.26-released
magic_pdf-0.3.27-released
magic_pdf-0.3.28-released
magic_pdf-0.3.29-released
magic_pdf-0.3.3-released
magic_pdf-0.3.30-released
magic_pdf-0.3.31-released
magic_pdf-0.3.32-released
magic_pdf-0.3.33-released
magic_pdf-0.3.34-released
magic_pdf-0.3.35-released
magic_pdf-0.3.36-released
magic_pdf-0.3.37-released
magic_pdf-0.3.4-released
magic_pdf-0.3.5-released
magic_pdf-0.3.6-released
magic_pdf-0.3.7-released
magic_pdf-0.3.8-released
magic_pdf-0.3.9-released
magic_pdf-0.4.0-released
magic_pdf-0.4.1-released
magic_pdf-0.4.10-released
magic_pdf-0.4.11-released
magic_pdf-0.4.12-released
magic_pdf-0.4.13-released
magic_pdf-0.4.14-released
magic_pdf-0.4.15-released
magic_pdf-0.4.16-released
magic_pdf-0.4.17-released
magic_pdf-0.4.18-released
magic_pdf-0.4.19-released
magic_pdf-0.4.2-released
magic_pdf-0.4.20-released
magic_pdf-0.4.21-released
magic_pdf-0.4.22-released
magic_pdf-0.4.23-released
magic_pdf-0.4.24-released
magic_pdf-0.4.25-released
magic_pdf-0.4.26-released
magic_pdf-0.4.27-released
magic_pdf-0.4.28-released
magic_pdf-0.4.3-released
magic_pdf-0.4.5-released
magic_pdf-0.4.6-released
magic_pdf-0.4.7-released
magic_pdf-0.4.8-released
magic_pdf-0.4.9-released
magic_pdf-0.5.0-released
magic_pdf-0.5.1-released
magic_pdf-0.5.10-released
magic_pdf-0.5.11-released
magic_pdf-0.5.12-released
magic_pdf-0.5.13-released
magic_pdf-0.5.2-released
magic_pdf-0.5.3-released
magic_pdf-0.5.4-released
magic_pdf-0.5.5-released
magic_pdf-0.5.6-released
magic_pdf-0.5.7-released
magic_pdf-0.5.8-released
magic_pdf-0.5.9-released
magic_pdf-0.6.0-released
magic_pdf-0.6.1-released
magic_pdf-0.6.2b1-released
magic_pdf-0.7.0a1-released
magic_pdf-0.7.0b1-released
magic_pdf-0.7.1-released
magic_pdf-0.8.0-released
magic_pdf-0.8.1-released
magic_pdf-0.8.1-update-docs
magic_pdf-0.9.0-released
magic_pdf-0.9.1-released
magic_pdf-0.9.2-released
magic_pdf-0.9.3-released
magic_pdf-1.0.0-released
magic_pdf-1.0.1-released
magic_pdf-1.1.0-released
magic_pdf-1.2.0-released
magic_pdf-1.2.1-released
magic_pdf-1.2.2-released
magic_pdf-1.3.0-released
magic_pdf-1.3.1-released
magic_pdf-1.3.10-released
magic_pdf-1.3.11-released
magic_pdf-1.3.12-released
magic_pdf-1.3.2-released
magic_pdf-1.3.3-released
magic_pdf-1.3.4-released
magic_pdf-1.3.5-released
magic_pdf-1.3.6-released
magic_pdf-1.3.7-released
magic_pdf-1.3.8-released
magic_pdf-1.3.9-released
mineru-2.0.0-released
mineru-2.0.1-released
mineru-2.0.2-released
mineru-2.0.3-released
mineru-2.0.4-released
mineru-2.0.5-released
mineru-2.0.6-released
mineru-2.1.0-released
mineru-2.1.1-released
mineru-2.1.10-released
mineru-2.1.11-released
mineru-2.1.2-released
mineru-2.1.3-released
mineru-2.1.4-released
mineru-2.1.5-released
mineru-2.1.6-released
mineru-2.1.7-released
mineru-2.1.8-released
mineru-2.1.9-released
mineru-2.2.0-released
mineru-2.2.1-released
mineru-2.2.2-released
mineru-2.5.0-released
mineru-2.5.1-released
mineru-2.5.2-released
mineru-2.5.3-released
mineru-2.5.4-released
mineru-2.6.0-released
mineru-2.6.1-released
mineru-2.6.2-released
mineru-2.6.3-released
mineru-2.6.4-released
mineru-2.6.5-released
mineru-2.6.6-released
mineru-2.6.7-released
mineru-2.6.8-released
mineru-2.7.0-released
mineru-2.7.1-released
mineru-2.7.2-released
mineru-2.7.3-released
mineru-2.7.4-released
mineru-2.7.5-released
mineru-2.7.6-released
-
6a75b39940
feat: add support for MUSA and NPU devices in device management functions
myhloli
2026-01-22 15:45:26 +08:00 -
78e83d00a7
feat: refine DOCX processing to adjust title level handling and streamline list item references
myhloli
2026-01-21 18:48:40 +08:00 -
7bcd3afb86
feat: refactor DOCX processing to unify block type handling for captions and list items
myhloli
2026-01-21 17:21:34 +08:00 -
517257e058
feat: enhance DOCX text processing to include equations and hyperlinks in content generation
myhloli
2026-01-21 17:04:22 +08:00 -
313ec8afa0
feat: add MinerU configuration options for vlm/hybrid backend
myhloli
2026-01-21 11:16:29 +08:00 -
ee4065ffd5
feat: refactor line object construction in DOCX processing to streamline block handling
myhloli
2026-01-21 11:08:19 +08:00 -
940289d083
feat: add Enflame setup guide and Dockerfile for GCU support
myhloli
2026-01-20 18:55:29 +08:00 -
21c9267a93
feat: enhance memory management for GCU device support in clean_memory function
myhloli
2026-01-20 17:34:27 +08:00 -
10d996d14e
feat: add 2.7.2 release notes with cross-page table merging optimization and new device support
myhloli
2026-01-20 17:26:21 +08:00 -
1d697c20bf
feat: update region area calculation for compatibility with skimage version 0.26.0
myhloli
2026-01-20 17:07:53 +08:00 -
333f6d3a32
Merge branch 'opendatalab:dev' into dev
Xiaomeng Zhao
2026-01-20 16:26:22 +08:00 -
7620bd4ccc
feat: add GCU device support for bf16 and memory calculations
myhloli
2026-01-20 16:06:20 +08:00 -
5026faa458
feat: update DOCX processing to change test document path and enhance chart handling with improved content structure
myhloli
2026-01-19 20:18:24 +08:00 -
8381e61f0c
feat: update DOCX processing to change test document path and enhance chart handling with improved content structure
myhloli
2026-01-19 18:37:56 +08:00 -
a8c4b6c2fe
Merge pull request #4388 from myhloli/add_docx
Xiaomeng Zhao
2026-01-19 17:02:34 +08:00 -
a0b0eb704c
Merge branch 'opendatalab:add_docx' into add_docx
Xiaomeng Zhao
2026-01-19 17:01:40 +08:00 -
1ed570a205
Merge pull request #4386 from Sidney233/add_docx
Xiaomeng Zhao
2026-01-19 17:00:58 +08:00 -
21ebf6bdb1
Merge branch 'opendatalab:add_docx' into add_docx
Sidney233
2026-01-19 16:28:13 +08:00 -
11513dd44c
feat: 添加图表处理excel表格
Sidney233
2026-01-19 16:26:27 +08:00 -
5706011633
feat: update device handling in YOLO model initialization for improved compatibility
myhloli
2026-01-19 15:58:10 +08:00 -
df07baea6c
feat: enhance table merging logic with effective column calculations and visual consistency checks
myhloli
2026-01-16 18:58:10 +08:00 -
c73c1d3847
feat: add support for Chinese continuation marker in table merging logic
myhloli
2026-01-16 17:17:47 +08:00 -
32592cd27f
feat: enhance DOCX header and footer processing by adding deduplication for inline equations and hyperlinks
myhloli
2026-01-16 17:16:51 +08:00 -
9137f84591
feat: enhance DOCX header and footer processing by adding deduplication for inline equations and hyperlinks
myhloli
2026-01-16 16:14:04 +08:00 -
56c3bb3570
feat: enhance DOCX processing by adding hyperlink support and improving text formatting with equations
myhloli
2026-01-16 16:04:45 +08:00 -
23e3a73f33
feat: enhance DOCX processing by adding hyperlink support and improving text formatting with equations
myhloli
2026-01-16 15:22:30 +08:00 -
e7c67a95b6
feat: enhance DOCX processing by adding main execution block and improving text content handling with equations
myhloli
2026-01-15 20:01:22 +08:00 -
ea6bb2ede9
feat: update result_to_middle_json function to streamline parameters and enhance JSON output structure
myhloli
2026-01-14 19:50:38 +08:00 -
c6543b4aeb
Merge pull request #4368 from myhloli/dev
Xiaomeng Zhao
2026-01-14 17:01:59 +08:00 -
5116192d32
feat: replace Gradio app script with iframe for improved integration
myhloli
2026-01-14 17:01:11 +08:00 -
810717b42a
feat: refactor DOCX processing by consolidating image handling and introducing MagicModel for block management
myhloli
2026-01-14 16:56:49 +08:00 -
7554127ff7
Merge pull request #4367 from Sidney233/add_docx
Xiaomeng Zhao
2026-01-14 16:47:31 +08:00 -
201ba86072
Merge pull request #4365 from tommygood/docs/fix-typos-spans-pdf
Xiaomeng Zhao
2026-01-14 16:44:38 +08:00 -
087d3686c5
@tommygood has signed the CLA in opendatalab/MinerU#4365
github-actions[bot]
2026-01-14 08:06:04 +00:00 -
d629ede38a
修复list_item重复统计,过滤掉内容为空的block,页眉页脚的纯数字内容不添加进page,caption识别
Sidney233
2026-01-14 16:04:47 +08:00 -
11252a5636
docs: correct file naming format to use '_span.pdf'
tommygood
2026-01-14 15:48:31 +08:00 -
db40932e6d
Merge pull request #4359 from opendatalab/dev
Xiaomeng Zhao
2026-01-13 19:51:36 +08:00 -
03698c656e
Merge pull request #4358 from myhloli/dev
Xiaomeng Zhao
2026-01-13 19:50:19 +08:00 -
48ded6b06c
feat: add Hygon entry to acceleration cards list
myhloli
2026-01-13 19:47:08 +08:00 -
4e66217909
Merge pull request #4357 from myhloli/dev
Xiaomeng Zhao
2026-01-13 19:46:07 +08:00 -
bdec40487e
feat: add Dockerfile for vLLM inference environment and Hygon platform documentation
myhloli
2026-01-13 19:45:18 +08:00 -
ec9b05003d
fix: add support for ellipsis continuation marker in table merging logic
myhloli
2026-01-13 15:50:15 +08:00 -
6501ad878d
Merge pull request #4353 from myhloli/add_docx
Xiaomeng Zhao
2026-01-13 15:15:15 +08:00 -
6c8fa9776f
feat: simplify element handling in DOCX processing by removing unnecessary references and improving structure
myhloli
2026-01-13 15:13:38 +08:00 -
1d93aa8ab9
Merge branch 'opendatalab:add_docx' into add_docx
Xiaomeng Zhao
2026-01-12 19:08:34 +08:00 -
9aba297545
Merge pull request #4349 from Sidney233/add_docx
Xiaomeng Zhao
2026-01-12 19:08:01 +08:00 -
dec84a9b5a
feat: disable model output dumping in DOCX processing for improved performance
myhloli
2026-01-12 18:33:13 +08:00 -
cbe39f4a5a
Merge branch 'opendatalab:add_docx' into add_docx
Sidney233
2026-01-12 17:10:51 +08:00 -
e042384953
分节与页眉页脚处理完成
Sidney233
2026-01-12 17:08:37 +08:00 -
a644a8a074
分节处理问题的TODO
Sidney233
2026-01-09 17:39:16 +08:00 -
c10f248721
Merge pull request #4330 from opendatalab/master
Xiaomeng Zhao
2026-01-09 12:04:07 +08:00 -
30c5d10e05
Archive MinerU Project List and update notes
Xiaomeng Zhao
2026-01-09 12:02:21 +08:00 -
4c3be9273c
Fix typo in README_zh-CN.md
Xiaomeng Zhao
2026-01-09 12:00:26 +08:00 -
1833163b97
Mark MinerU project as archived in README
Xiaomeng Zhao
2026-01-09 12:00:10 +08:00 -
eb55029adf
Merge pull request #4318 from myhloli/dev
Xiaomeng Zhao
2026-01-07 20:27:38 +08:00 -
2eef53a9f0
fix: improve continuation marker handling in table caption merging logic
myhloli
2026-01-07 20:17:13 +08:00 -
9e6e2bde85
fix: refine caption merging logic to improve handling of continuation markers
myhloli
2026-01-07 20:05:26 +08:00 -
c73e93bec0
fix: enhance table merging logic to handle footnotes more effectively
myhloli
2026-01-07 19:50:46 +08:00 -
07db6839b8
feat: refactor logging to use loguru and add BlockType and ContentBlock classes for structured content handling
myhloli
2026-01-07 19:24:18 +08:00 -
17394682e2
feat: add lxml dependency for enhanced XML processing in DOCX handling
myhloli
2026-01-07 14:22:57 +08:00 -
97bd2a2b94
Merge pull request #4310 from myhloli/add_docx
Xiaomeng Zhao
2026-01-07 10:38:52 +08:00 -
ad175df3d2
feat: enhance DOCX processing by refining image handling and improving logging for inference timing
myhloli
2026-01-06 20:04:06 +08:00 -
0cbe965d97
feat: enhance DOCX processing by adding support for office file types and refactoring related functions
myhloli
2026-01-06 19:49:40 +08:00 -
74f6d4d0e7
Merge pull request #4309 from myhloli/add_docx
Xiaomeng Zhao
2026-01-06 17:19:32 +08:00 -
648fb1f7cf
feat: update array formatting in latex_dict.py for improved LaTeX output
myhloli
2026-01-06 17:19:01 +08:00 -
b6fc07cf9e
feat: replace logging with loguru for improved logging functionality in OMML processing
myhloli
2026-01-06 17:11:06 +08:00 -
57be6926a9
feat: enhance OMML processing with additional LaTeX functions and improve unicode handling
myhloli
2026-01-06 16:22:05 +08:00 -
7abcfa39a0
Merge pull request #4308 from myhloli/add_docx
Xiaomeng Zhao
2026-01-06 16:17:19 +08:00 -
6f76664141
feat: refactor DOCX utilities and update dependencies for improved processing
myhloli
2026-01-06 16:15:44 +08:00 -
1dfbea157a
Merge pull request #4306 from opendatalab/master
Xiaomeng Zhao
2026-01-06 15:03:27 +08:00 -
96840733c4
Update version.py with new version
myhloli
2026-01-06 06:55:29 +00:00 -
45f8ad1d5c
Merge pull request #4305 from opendatalab/release-2.7.1
mineru-2.7.1-released
Xiaomeng Zhao
2026-01-06 14:47:23 +08:00 -
b69191ba2b
Merge pull request #4304 from opendatalab/dev
release-2.7.1
Xiaomeng Zhao
2026-01-06 14:46:18 +08:00 -
0028514ced
Merge pull request #4303 from myhloli/dev
Xiaomeng Zhao
2026-01-06 14:45:35 +08:00 -
8d8daf6851
fix: add qwen-vl-utils dependency to pyproject.toml
myhloli
2026-01-06 14:44:53 +08:00 -
815280dd23
fix: update pdfminer.six dependency to resolve CVE-2025-64512 and improve EXIF handling
myhloli
2026-01-06 14:42:48 +08:00 -
7b52f92aea
fix: update pdfminer.six dependency to resolve CVE-2025-64512 and improve EXIF handling
myhloli
2026-01-06 14:41:47 +08:00 -
33543b76c9
Merge pull request #4301 from myhloli/dev
Xiaomeng Zhao
2026-01-06 14:10:08 +08:00 -
ea5f8e98dd
fix: update pdfminer.six version to 20251230 in pyproject.toml
myhloli
2026-01-06 11:54:17 +08:00 -
8996e06448
fix: restore hybrid analyze imports in common.py for backend processing
myhloli
2026-01-06 11:51:31 +08:00 -
23bc263b85
Merge pull request #4299 from myhloli/add_docx
Xiaomeng Zhao
2026-01-06 11:27:20 +08:00 -
53fb1cd055
feat: implement DOCX processing in the converter
myhloli
2026-01-06 11:26:18 +08:00 -
f0ce905c7d
fix: update pdfminer.six version to 20251230 in pyproject.toml
myhloli
2026-01-05 19:08:25 +08:00 -
df33d483de
Merge remote-tracking branch 'origin/add_docx' into add_docx
myhloli
2026-01-05 17:44:38 +08:00 -
f44fb174ea
feat: add support for DOCX file format in converter
myhloli
2026-01-05 17:44:17 +08:00 -
70b1e73606
Merge pull request #4293 from Sidney233/docx-dev
Xiaomeng Zhao
2026-01-05 17:43:10 +08:00 -
11fb0a0199
fix: add util files
Sidney233
2026-01-05 17:40:37 +08:00 -
66f8f0e93a
Merge pull request #4292 from Sidney233/docx-dev
Xiaomeng Zhao
2026-01-05 14:10:21 +08:00 -
942c1693c7
Merge branch 'add_docx' into docx-dev
Xiaomeng Zhao
2026-01-05 14:10:04 +08:00 -
7387797b17
work review
Sidney233
2026-01-05 13:33:55 +08:00 -
bfb304ef1f
fix: improve EXIF handling and save PDF logic in pdf_image_tools.py
myhloli
2026-01-05 00:27:01 +08:00 -
17e6016b58
Merge pull request #4283 from kingdomad/fix/image-exif-rotation
Xiaomeng Zhao
2026-01-04 18:31:06 +08:00 -
ba06cd14ef
Update pdf_image_tools.py
Xiaomeng Zhao
2026-01-04 18:29:51 +08:00 -
0209ada8d0
Merge pull request #4287 from myhloli/dev
Xiaomeng Zhao
2026-01-04 15:26:16 +08:00 -
e2140222bc
docs: update VastAI.md with new version numbers and improved instructions
myhloli
2026-01-04 15:24:23 +08:00 -
d679d99192
docs: update heading from '快速开始' to '快速入门' for consistency
myhloli
2026-01-04 15:16:15 +08:00 -
4bfcc0b808
Merge pull request #4286 from opendatalab/master
Xiaomeng Zhao
2026-01-04 15:12:00 +08:00 -
ead29489ff
Merge pull request #4285 from myhloli/dev
Xiaomeng Zhao
2026-01-04 15:11:29 +08:00 -
c01e35b4c6
docs: update navigation and terminology in documentation for clarity
myhloli
2026-01-04 15:10:37 +08:00 -
a89249069c
Merge pull request #4284 from myhloli/dev
Xiaomeng Zhao
2026-01-04 14:34:15 +08:00