mirror of
https://github.com/DS4SD/docling.git
synced 2025-12-08 20:58:11 +00:00
Commit Graph
Select branches
Hide Pull Requests
add-json-export-indentation
adr-model-stages
cau/dpv4-test-updates
cau/fix-layout-vlm-pipeline-artifacts-path
cau/layout-vlm-pipeline-page-images
cau/multi-stage-vlm-pipeline
cau/new-layout-processing
cau/pin-docling-parse-pre-3.2
cau/test-dp-word-lines
cau/test-pypdfium2-beta
copilot/fix-document-timeout-bug
copilot/fix-keyerror-in-docling
copilot/fix-page-range-bug
cp_main_20250602
demo
dev-granite-docling-table
dev/add-asr-pipeline
dev/add-granite-docling-extension
dev/add-granite-docling-preview
dev/add-r2l-tests
dev/add-reading-order-model
dev/add-two-stage-vlm
dev/analysis-for-granite-docling
dev/doctag_backend
dev/fix_msword_backend_identify_text_after_image
dev/table-orientation
dev/update-html-parser-with-h1
dev/update-to-latest-docling-parse-again
docs/add-extraction-script
elh/update_2stage_inference
extend-metadata-in-examples
gh-pages
main
mao/doctags
mly/smol-docling-integration
nli/fix_glm_utils
nli/fix_ocr_tests
nli/layout_dfine
nli/layout_heron2
nli/layout_rtdetr_v2
nli/layoutmodel_improvements
nli/tesseract_ocr_models
ocr-enrichment
pretest-core-2-51-0
propagate-core-fixes-20250502
remodel-lists-2
revert-803-refactor_viz
rtdl/docx_latex
rtdl/drawingml_import
vku/uspto_meta
#1
#10
#100
#101
#1010
#1015
#1017
#102
#1021
#1024
#1027
#103
#1038
#1039
#1040
#1041
#1051
#1052
#1053
#1054
#1055
#1057
#1061
#1062
#1077
#1096
#1097
#1098
#11
#110
#1100
#1106
#1107
#111
#1114
#1115
#1118
#1124
#1130
#1140
#1141
#1147
#1150
#1152
#1154
#1156
#1158
#1160
#1165
#1167
#117
#1173
#118
#1182
#1183
#1194
#1196
#1197
#1199
#12
#120
#1201
#121
#1210
#122
#1220
#1222
#1223
#123
#1231
#1238
#1239
#1241
#1244
#1247
#1248
#1261
#1263
#1268
#1270
#1286
#129
#1294
#1295
#13
#131
#1313
#1315
#1316
#1319
#132
#1320
#1326
#1328
#1332
#1334
#1337
#134
#1340
#1346
#135
#1350
#1355
#1359
#1363
#1371
#1375
#1377
#1378
#1379
#138
#1381
#1382
#1383
#1389
#139
#1392
#1399
#14
#140
#1400
#1402
#141
#1411
#1415
#1416
#1419
#1427
#1428
#143
#1430
#1436
#1442
#1449
#145
#1458
#1459
#1463
#1465
#1486
#149
#1490
#1492
#1494
#1496
#15
#150
#1500
#151
#1511
#1512
#152
#1520
#1523
#1524
#1525
#1526
#1527
#1528
#153
#1530
#1536
#1538
#154
#1548
#1549
#155
#1551
#1553
#1556
#1559
#156
#1560
#1561
#1563
#1566
#157
#1570
#1576
#1577
#158
#1582
#1583
#1587
#1589
#159
#1593
#1596
#16
#160
#1600
#1609
#161
#1610
#1615
#1617
#1619
#162
#1636
#164
#1658
#1659
#1660
#1663
#1664
#1665
#1667
#1671
#1673
#1676
#1679
#168
#1683
#1684
#1688
#1689
#169
#1691
#1698
#17
#170
#1700
#1701
#1706
#1707
#171
#1711
#1717
#1718
#1723
#1724
#1725
#1728
#173
#1734
#1735
#1745
#1746
#1747
#175
#1759
#1763
#1769
#177
#1772
#1775
#178
#179
#1791
#1795
#18
#180
#1802
#1804
#1808
#1810
#1812
#1815
#1816
#1819
#182
#1820
#1821
#1824
#1825
#1827
#183
#1836
#1838
#184
#1844
#1850
#1851
#1852
#1856
#1857
#186
#1863
#1866
#1867
#187
#1870
#1874
#1875
#1876
#188
#1884
#189
#1897
#1898
#1898
#19
#190
#1902
#1904
#1905
#1907
#1908
#1910
#1912
#1914
#1917
#1923
#1925
#1926
#1928
#193
#1931
#1934
#1937
#194
#1940
#1943
#1948
#1951
#1952
#196
#1960
#1969
#1970
#1971
#1975
#1981
#1982
#1984
#1986
#1988
#1989
#1992
#1995
#2
#20
#2001
#2002
#2006
#2011
#2017
#2018
#2024
#203
#2031
#2039
#2042
#2048
#2061
#2068
#2069
#2078
#2079
#2083
#2084
#2084
#2088
#2093
#2094
#2095
#2095
#21
#2100
#2105
#2106
#2110
#2111
#2112
#2113
#2114
#2114
#2122
#2123
#2124
#2126
#2131
#2132
#2133
#2138
#214
#2141
#2146
#2154
#2155
#2165
#2166
#2169
#217
#217
#2171
#2178
#218
#218
#2183
#2185
#2187
#219
#2199
#22
#2200
#2208
#2212
#2218
#2219
#2227
#2227
#2231
#2234
#2237
#2238
#224
#2242
#2244
#2251
#2252
#226
#2262
#2264
#2265
#2266
#2272
#228
#2281
#2284
#2284
#2287
#2288
#229
#2291
#2294
#2304
#2309
#2313
#2315
#2322
#2323
#2324
#233
#2339
#234
#2340
#2341
#235
#2357
#2359
#2361
#2365
#2366
#2371
#2372
#2373
#2378
#2378
#2382
#2383
#2388
#2391
#2394
#240
#2401
#2403
#2403
#2404
#2407
#2409
#2409
#241
#2410
#2411
#2413
#2415
#2418
#2420
#2421
#2422
#2423
#2424
#2425
#2426
#2427
#2429
#2430
#2431
#2433
#2436
#2441
#2442
#2445
#2445
#2447
#2452
#2453
#2454
#2458
#2459
#2468
#2473
#2474
#248
#2484
#2486
#2488
#2488
#2489
#2498
#2499
#2501
#2502
#2503
#251
#2511
#2512
#2513
#2517
#2519
#2520
#2521
#2526
#2527
#2530
#2531
#2533
#2541
#2543
#2546
#2548
#2549
#2553
#2563
#2569
#2571
#2573
#2578
#2582
#2585
#2587
#2587
#2588
#2589
#259
#2596
#2599
#26
#2600
#2605
#2613
#2618
#2622
#2622
#2624
#2627
#2636
#2637
#2638
#2639
#2640
#2641
#2644
#2645
#2645
#2648
#2649
#2651
#2653
#2656
#2658
#2659
#2660
#2662
#2664
#2665
#2669
#2671
#2674
#2676
#2676
#2678
#2678
#2682
#2682
#2689
#2692
#2693
#27
#2706
#2707
#2708
#2712
#2716
#2717
#2720
#2721
#2721
#2723
#2723
#2728
#2735
#2738
#2738
#2739
#2740
#2740
#2741
#2741
#275
#276
#279
#28
#282
#286
#29
#290
#3
#302
#305
#307
#31
#310
#312
#314
#315
#316
#319
#32
#320
#322
#323
#325
#33
#330
#332
#334
#339
#34
#340
#341
#349
#35
#350
#36
#37
#371
#374
#375
#378
#379
#38
#384
#388
#39
#392
#393
#396
#4
#40
#401
#407
#408
#409
#415
#416
#42
#429
#43
#430
#432
#44
#442
#449
#45
#451
#456
#457
#46
#466
#467
#468
#47
#472
#474
#475
#482
#484
#487
#49
#490
#492
#495
#496
#497
#5
#50
#500
#501
#502
#504
#51
#511
#512
#513
#514
#517
#52
#528
#53
#530
#531
#532
#533
#534
#537
#54
#544
#549
#550
#551
#552
#555
#556
#557
#558
#56
#569
#57
#58
#59
#593
#6
#604
#606
#608
#613
#615
#616
#618
#624
#628
#63
#630
#631
#633
#642
#65
#650
#655
#656
#662
#675
#679
#68
#69
#691
#693
#694
#695
#697
#698
#7
#70
#700
#701
#702
#708
#71
#716
#717
#718
#719
#72
#733
#735
#739
#742
#75
#752
#759
#769
#772
#777
#783
#786
#788
#79
#793
#8
#80
#800
#801
#803
#804
#805
#808
#81
#811
#814
#815
#816
#817
#818
#819
#82
#820
#821
#824
#825
#826
#827
#83
#830
#831
#832
#837
#839
#84
#841
#842
#843
#850
#852
#853
#854
#855
#856
#857
#86
#862
#868
#869
#872
#873
#874
#875
#876
#878
#88
#880
#881
#883
#896
#897
#90
#901
#903
#905
#91
#910
#912
#916
#919
#92
#929
#93
#932
#935
#940
#941
#945
#948
#949
#95
#951
#958
#96
#965
#966
#967
#98
#99
#999
v0.1.1
v0.2.0
v0.3.0
v0.3.1
v0.4.0
v1.0.0
v1.0.1
v1.0.2
v1.1.0
v1.1.1
v1.1.2
v1.10.0
v1.11.0
v1.12.0
v1.12.1
v1.12.2
v1.13.0
v1.13.1
v1.14.0
v1.15.0
v1.16.0
v1.16.1
v1.17.0
v1.18.0
v1.19.0
v1.19.1
v1.2.0
v1.2.1
v1.20.0
v1.3.0
v1.4.0
v1.5.0
v1.6.0
v1.6.1
v1.6.2
v1.6.3
v1.7.0
v1.7.1
v1.8.0
v1.8.1
v1.8.2
v1.8.3
v1.8.4
v1.8.5
v1.9.0
v2.0.0
v2.1.0
v2.10.0
v2.11.0
v2.12.0
v2.13.0
v2.14.0
v2.15.0
v2.15.1
v2.16.0
v2.17.0
v2.18.0
v2.19.0
v2.2.0
v2.2.1
v2.20.0
v2.21.0
v2.22.0
v2.23.0
v2.23.1
v2.24.0
v2.25.0
v2.25.1
v2.25.2
v2.26.0
v2.27.0
v2.28.0
v2.28.1
v2.28.2
v2.28.3
v2.28.4
v2.29.0
v2.3.0
v2.3.1
v2.30.0
v2.31.0
v2.31.1
v2.31.2
v2.32.0
v2.33.0
v2.34.0
v2.35.0
v2.36.0
v2.36.1
v2.37.0
v2.38.0
v2.38.1
v2.39.0
v2.4.0
v2.4.1
v2.4.2
v2.40.0
v2.41.0
v2.42.0
v2.42.1
v2.42.2
v2.43.0
v2.44.0
v2.45.0
v2.46.0
v2.47.0
v2.47.1
v2.48.0
v2.49.0
v2.5.0
v2.5.1
v2.5.2
v2.50.0
v2.51.0
v2.52.0
v2.53.0
v2.54.0
v2.55.0
v2.55.1
v2.56.0
v2.56.1
v2.57.0
v2.58.0
v2.59.0
v2.6.0
v2.60.0
v2.60.1
v2.61.0
v2.61.1
v2.61.2
v2.62.0
v2.63.0
v2.64.0
v2.7.0
v2.7.1
v2.8.0
v2.8.1
v2.8.2
v2.8.3
v2.9.0
Select branches
Hide Pull Requests
add-json-export-indentation
adr-model-stages
cau/dpv4-test-updates
cau/fix-layout-vlm-pipeline-artifacts-path
cau/layout-vlm-pipeline-page-images
cau/multi-stage-vlm-pipeline
cau/new-layout-processing
cau/pin-docling-parse-pre-3.2
cau/test-dp-word-lines
cau/test-pypdfium2-beta
copilot/fix-document-timeout-bug
copilot/fix-keyerror-in-docling
copilot/fix-page-range-bug
cp_main_20250602
demo
dev-granite-docling-table
dev/add-asr-pipeline
dev/add-granite-docling-extension
dev/add-granite-docling-preview
dev/add-r2l-tests
dev/add-reading-order-model
dev/add-two-stage-vlm
dev/analysis-for-granite-docling
dev/doctag_backend
dev/fix_msword_backend_identify_text_after_image
dev/table-orientation
dev/update-html-parser-with-h1
dev/update-to-latest-docling-parse-again
docs/add-extraction-script
elh/update_2stage_inference
extend-metadata-in-examples
gh-pages
main
mao/doctags
mly/smol-docling-integration
nli/fix_glm_utils
nli/fix_ocr_tests
nli/layout_dfine
nli/layout_heron2
nli/layout_rtdetr_v2
nli/layoutmodel_improvements
nli/tesseract_ocr_models
ocr-enrichment
pretest-core-2-51-0
propagate-core-fixes-20250502
remodel-lists-2
revert-803-refactor_viz
rtdl/docx_latex
rtdl/drawingml_import
vku/uspto_meta
#1
#10
#100
#101
#1010
#1015
#1017
#102
#1021
#1024
#1027
#103
#1038
#1039
#1040
#1041
#1051
#1052
#1053
#1054
#1055
#1057
#1061
#1062
#1077
#1096
#1097
#1098
#11
#110
#1100
#1106
#1107
#111
#1114
#1115
#1118
#1124
#1130
#1140
#1141
#1147
#1150
#1152
#1154
#1156
#1158
#1160
#1165
#1167
#117
#1173
#118
#1182
#1183
#1194
#1196
#1197
#1199
#12
#120
#1201
#121
#1210
#122
#1220
#1222
#1223
#123
#1231
#1238
#1239
#1241
#1244
#1247
#1248
#1261
#1263
#1268
#1270
#1286
#129
#1294
#1295
#13
#131
#1313
#1315
#1316
#1319
#132
#1320
#1326
#1328
#1332
#1334
#1337
#134
#1340
#1346
#135
#1350
#1355
#1359
#1363
#1371
#1375
#1377
#1378
#1379
#138
#1381
#1382
#1383
#1389
#139
#1392
#1399
#14
#140
#1400
#1402
#141
#1411
#1415
#1416
#1419
#1427
#1428
#143
#1430
#1436
#1442
#1449
#145
#1458
#1459
#1463
#1465
#1486
#149
#1490
#1492
#1494
#1496
#15
#150
#1500
#151
#1511
#1512
#152
#1520
#1523
#1524
#1525
#1526
#1527
#1528
#153
#1530
#1536
#1538
#154
#1548
#1549
#155
#1551
#1553
#1556
#1559
#156
#1560
#1561
#1563
#1566
#157
#1570
#1576
#1577
#158
#1582
#1583
#1587
#1589
#159
#1593
#1596
#16
#160
#1600
#1609
#161
#1610
#1615
#1617
#1619
#162
#1636
#164
#1658
#1659
#1660
#1663
#1664
#1665
#1667
#1671
#1673
#1676
#1679
#168
#1683
#1684
#1688
#1689
#169
#1691
#1698
#17
#170
#1700
#1701
#1706
#1707
#171
#1711
#1717
#1718
#1723
#1724
#1725
#1728
#173
#1734
#1735
#1745
#1746
#1747
#175
#1759
#1763
#1769
#177
#1772
#1775
#178
#179
#1791
#1795
#18
#180
#1802
#1804
#1808
#1810
#1812
#1815
#1816
#1819
#182
#1820
#1821
#1824
#1825
#1827
#183
#1836
#1838
#184
#1844
#1850
#1851
#1852
#1856
#1857
#186
#1863
#1866
#1867
#187
#1870
#1874
#1875
#1876
#188
#1884
#189
#1897
#1898
#1898
#19
#190
#1902
#1904
#1905
#1907
#1908
#1910
#1912
#1914
#1917
#1923
#1925
#1926
#1928
#193
#1931
#1934
#1937
#194
#1940
#1943
#1948
#1951
#1952
#196
#1960
#1969
#1970
#1971
#1975
#1981
#1982
#1984
#1986
#1988
#1989
#1992
#1995
#2
#20
#2001
#2002
#2006
#2011
#2017
#2018
#2024
#203
#2031
#2039
#2042
#2048
#2061
#2068
#2069
#2078
#2079
#2083
#2084
#2084
#2088
#2093
#2094
#2095
#2095
#21
#2100
#2105
#2106
#2110
#2111
#2112
#2113
#2114
#2114
#2122
#2123
#2124
#2126
#2131
#2132
#2133
#2138
#214
#2141
#2146
#2154
#2155
#2165
#2166
#2169
#217
#217
#2171
#2178
#218
#218
#2183
#2185
#2187
#219
#2199
#22
#2200
#2208
#2212
#2218
#2219
#2227
#2227
#2231
#2234
#2237
#2238
#224
#2242
#2244
#2251
#2252
#226
#2262
#2264
#2265
#2266
#2272
#228
#2281
#2284
#2284
#2287
#2288
#229
#2291
#2294
#2304
#2309
#2313
#2315
#2322
#2323
#2324
#233
#2339
#234
#2340
#2341
#235
#2357
#2359
#2361
#2365
#2366
#2371
#2372
#2373
#2378
#2378
#2382
#2383
#2388
#2391
#2394
#240
#2401
#2403
#2403
#2404
#2407
#2409
#2409
#241
#2410
#2411
#2413
#2415
#2418
#2420
#2421
#2422
#2423
#2424
#2425
#2426
#2427
#2429
#2430
#2431
#2433
#2436
#2441
#2442
#2445
#2445
#2447
#2452
#2453
#2454
#2458
#2459
#2468
#2473
#2474
#248
#2484
#2486
#2488
#2488
#2489
#2498
#2499
#2501
#2502
#2503
#251
#2511
#2512
#2513
#2517
#2519
#2520
#2521
#2526
#2527
#2530
#2531
#2533
#2541
#2543
#2546
#2548
#2549
#2553
#2563
#2569
#2571
#2573
#2578
#2582
#2585
#2587
#2587
#2588
#2589
#259
#2596
#2599
#26
#2600
#2605
#2613
#2618
#2622
#2622
#2624
#2627
#2636
#2637
#2638
#2639
#2640
#2641
#2644
#2645
#2645
#2648
#2649
#2651
#2653
#2656
#2658
#2659
#2660
#2662
#2664
#2665
#2669
#2671
#2674
#2676
#2676
#2678
#2678
#2682
#2682
#2689
#2692
#2693
#27
#2706
#2707
#2708
#2712
#2716
#2717
#2720
#2721
#2721
#2723
#2723
#2728
#2735
#2738
#2738
#2739
#2740
#2740
#2741
#2741
#275
#276
#279
#28
#282
#286
#29
#290
#3
#302
#305
#307
#31
#310
#312
#314
#315
#316
#319
#32
#320
#322
#323
#325
#33
#330
#332
#334
#339
#34
#340
#341
#349
#35
#350
#36
#37
#371
#374
#375
#378
#379
#38
#384
#388
#39
#392
#393
#396
#4
#40
#401
#407
#408
#409
#415
#416
#42
#429
#43
#430
#432
#44
#442
#449
#45
#451
#456
#457
#46
#466
#467
#468
#47
#472
#474
#475
#482
#484
#487
#49
#490
#492
#495
#496
#497
#5
#50
#500
#501
#502
#504
#51
#511
#512
#513
#514
#517
#52
#528
#53
#530
#531
#532
#533
#534
#537
#54
#544
#549
#550
#551
#552
#555
#556
#557
#558
#56
#569
#57
#58
#59
#593
#6
#604
#606
#608
#613
#615
#616
#618
#624
#628
#63
#630
#631
#633
#642
#65
#650
#655
#656
#662
#675
#679
#68
#69
#691
#693
#694
#695
#697
#698
#7
#70
#700
#701
#702
#708
#71
#716
#717
#718
#719
#72
#733
#735
#739
#742
#75
#752
#759
#769
#772
#777
#783
#786
#788
#79
#793
#8
#80
#800
#801
#803
#804
#805
#808
#81
#811
#814
#815
#816
#817
#818
#819
#82
#820
#821
#824
#825
#826
#827
#83
#830
#831
#832
#837
#839
#84
#841
#842
#843
#850
#852
#853
#854
#855
#856
#857
#86
#862
#868
#869
#872
#873
#874
#875
#876
#878
#88
#880
#881
#883
#896
#897
#90
#901
#903
#905
#91
#910
#912
#916
#919
#92
#929
#93
#932
#935
#940
#941
#945
#948
#949
#95
#951
#958
#96
#965
#966
#967
#98
#99
#999
v0.1.1
v0.2.0
v0.3.0
v0.3.1
v0.4.0
v1.0.0
v1.0.1
v1.0.2
v1.1.0
v1.1.1
v1.1.2
v1.10.0
v1.11.0
v1.12.0
v1.12.1
v1.12.2
v1.13.0
v1.13.1
v1.14.0
v1.15.0
v1.16.0
v1.16.1
v1.17.0
v1.18.0
v1.19.0
v1.19.1
v1.2.0
v1.2.1
v1.20.0
v1.3.0
v1.4.0
v1.5.0
v1.6.0
v1.6.1
v1.6.2
v1.6.3
v1.7.0
v1.7.1
v1.8.0
v1.8.1
v1.8.2
v1.8.3
v1.8.4
v1.8.5
v1.9.0
v2.0.0
v2.1.0
v2.10.0
v2.11.0
v2.12.0
v2.13.0
v2.14.0
v2.15.0
v2.15.1
v2.16.0
v2.17.0
v2.18.0
v2.19.0
v2.2.0
v2.2.1
v2.20.0
v2.21.0
v2.22.0
v2.23.0
v2.23.1
v2.24.0
v2.25.0
v2.25.1
v2.25.2
v2.26.0
v2.27.0
v2.28.0
v2.28.1
v2.28.2
v2.28.3
v2.28.4
v2.29.0
v2.3.0
v2.3.1
v2.30.0
v2.31.0
v2.31.1
v2.31.2
v2.32.0
v2.33.0
v2.34.0
v2.35.0
v2.36.0
v2.36.1
v2.37.0
v2.38.0
v2.38.1
v2.39.0
v2.4.0
v2.4.1
v2.4.2
v2.40.0
v2.41.0
v2.42.0
v2.42.1
v2.42.2
v2.43.0
v2.44.0
v2.45.0
v2.46.0
v2.47.0
v2.47.1
v2.48.0
v2.49.0
v2.5.0
v2.5.1
v2.5.2
v2.50.0
v2.51.0
v2.52.0
v2.53.0
v2.54.0
v2.55.0
v2.55.1
v2.56.0
v2.56.1
v2.57.0
v2.58.0
v2.59.0
v2.6.0
v2.60.0
v2.60.1
v2.61.0
v2.61.1
v2.61.2
v2.62.0
v2.63.0
v2.64.0
v2.7.0
v2.7.1
v2.8.0
v2.8.1
v2.8.2
v2.8.3
v2.9.0
-
5f5fea90a9
docs: update custom convert and dockerfile (#226)
Michele Dolfi
2024-11-04 14:27:40 +01:00 -
41acaa9e2e
docs: correct spelling of 'individual' (#219)
Vicky Sekhon
2024-11-04 08:27:02 -05:00 -
40ad987303
feat: pdf backend, table mode as options and artifacts path (#203)
Michele Dolfi
2024-11-04 14:26:05 +01:00 -
af323c04ef
fit: Specify encoding when writing output file (#214)
Johnny Salazar
2024-11-04 20:24:13 +07:00 -
8fb445f46c
chore: make tests lighter (#228)
Panos Vagenas
2024-11-04 14:02:28 +01:00 -
5fc4d5bd3d
work-in-progress: dealing with in attributes of html elements
Peter Staar
2024-11-02 09:27:07 +01:00 -
244ca69cfd
docs: update LlamaIndex docs (#196)
Panos Vagenas
2024-11-01 20:55:28 +01:00 -
473ad9a032
add the skip_furniture parameter
Peter Staar
2024-11-01 11:32:56 +01:00 -
ebe0b203c8
added the detection of h1 and the skip_furniture parameter
Peter Staar
2024-10-31 16:06:41 +01:00 -
c52e68c52b
feat: add ability to detect h1 and filter from there-on
Peter Staar
2024-10-31 15:50:26 +01:00 -
9d8865856d
chore: bump version to 2.3.1 [skip ci]
v2.3.1
github-actions[bot]
2024-10-30 18:23:53 +00:00 -
eb679ccbb4
fix: simplify torch dependencies and update pinned docling deps (#190)
Michele Dolfi
2024-10-30 18:44:08 +01:00 -
904d24d600
fix: allow to explicitly initialize the pipeline (#189)
Michele Dolfi
2024-10-30 17:54:53 +01:00 -
43349865d0
chore: bump version to 2.3.0 [skip ci]
v2.3.0
github-actions[bot]
2024-10-30 14:47:37 +00:00 -
2a2c65bf4f
feat: Add pipeline timings and toggle visualization, establish debug settings (#183)
Christoph Auer
2024-10-30 15:04:19 +01:00 -
94a5290789
chore: update the with input formats and DoclingDocument (#188)
Peter W. J. Staar
2024-10-30 15:02:28 +01:00 -
f542460af3
fix: fix duplicate title and heading + add e2e tests for html and docx (#186)
Peter W. J. Staar
2024-10-30 13:14:56 +01:00 -
70865b4c7d
fix: make CLI JSON export more human-readable
add-json-export-indentation
Panos Vagenas
2024-10-29 08:54:41 +01:00 -
dda2645d4c
chore: bump version to 2.2.1 [skip ci]
v2.2.1
github-actions[bot]
2024-10-28 17:18:41 +00:00 -
b9f5c74a7d
fix: fix header levels for DOCX & HTML (#184)
Panos Vagenas
2024-10-28 17:02:52 +01:00 -
94d0729c50
fix: handling of long sequence of unescaped underscore chars in markdown (#173)
Maxim Lysak
2024-10-28 16:34:48 +01:00 -
2cece27208
docs: update LlamaIndex docs for Docling v2 (#182)
Panos Vagenas
2024-10-28 14:28:26 +01:00 -
189d3c2d44
docs: fix batch convert (#177)
Michele Dolfi
2024-10-26 05:50:34 +02:00 -
7d19418b77
fix: HTML backend, fixes for Lists and nested texts (#180)
Maxim Lysak
2024-10-25 20:14:04 +02:00 -
88c1673057
fix: MD Backend, fixes to properly handle trailing inline text and emphasis in headers (#178)
Maxim Lysak
2024-10-25 18:02:20 +02:00 -
77a89c3334
chore: make auto-release on request (#179)
Michele Dolfi
2024-10-25 10:47:25 +02:00 -
8d356aa247
docs: add export with embedded images (#175)
Michele Dolfi
2024-10-24 20:19:41 +02:00 -
8208c93e3a
chore: bump version to 2.2.0 [skip ci]
v2.2.0
github-actions[bot]
2024-10-23 16:04:55 +00:00 -
4116819b51
feat: Update to docling-parse v2 without history (#170)
Peter W. J. Staar
2024-10-23 17:20:11 +02:00 -
3023f18ba0
feat: Support AsciiDoc and Markdown input format (#168)
Christoph Auer
2024-10-23 16:14:26 +02:00 -
3496b4838f
fix: set valid=false for invalid backends (#171)
Michele Dolfi
2024-10-23 15:52:30 +02:00 -
b8d2286dd1
chore: various minor docs fixes (#169)
Panos Vagenas
2024-10-22 15:29:36 +02:00 -
fa5f94ec10
Fix Typo errors in CONTRIBUTING.md file (#164)
Mohamed Ali
2024-10-22 10:31:48 +05:30 -
d5460e2d1f
chore: bump version to 2.1.0 [skip ci]
v2.1.0
github-actions[bot]
2024-10-18 13:21:15 +00:00 -
b346faf622
feat: add coverage_threshold to skip OCR for small images (#161)
Michele Dolfi
2024-10-18 13:58:23 +02:00 -
f799e777c1
docs: typo fix (#155)
ABHISHEK FADAKE
2024-10-18 17:26:48 +05:30 -
63bef59d9e
fix: fix legacy doc ref (#162)
Panos Vagenas
2024-10-18 13:11:20 +02:00 -
bb7a58d45d
ci: run ci also on forks (#160)
Michele Dolfi
2024-10-18 12:32:27 +02:00 -
a00c937e19
Ensure all models work only on valid pages (#158)
Christoph Auer
2024-10-18 08:54:06 +02:00 -
034a411057
docs: add graphical band in readme (#154)
Maxim Lysak
2024-10-17 18:15:40 +02:00 -
61c092f445
docs: add use docling (#150)
Michele Dolfi
2024-10-17 18:14:48 +02:00 -
24f949ada2
chore: run apt-get update before install (#156)
Michele Dolfi
2024-10-17 17:27:16 +02:00 -
a29c256041
chore: bump version to 2.0.0 [skip ci]
v2.0.0
github-actions[bot]
2024-10-16 19:48:06 +00:00 -
7d3be0edeb
feat!: Docling v2 (#117)
Christoph Auer
2024-10-16 21:02:03 +02:00 -
d504432c1e
docs: introduce docs site (#141)
Panos Vagenas
2024-10-14 14:13:13 +02:00 -
2b1e72d327
refactor: fix type of tesseractocr options (#140)
Michele Dolfi
2024-10-14 08:40:22 +02:00 -
4672b24c1a
chore: bump version to 1.20.0 [skip ci]
v1.20.0
github-actions[bot]
2024-10-11 13:48:02 +00:00 -
5e4944f15f
feat: new experimental docling-parse v2 backend (#131)
Christoph Auer
2024-10-11 15:12:49 +02:00 -
2ec39636f0
chore: bump version to 1.19.1 [skip ci]
v1.19.1
github-actions[bot]
2024-10-11 08:52:09 +00:00 -
dae2a3b667
fix: remove stderr from tesseract cli and introduce fuzziness in the text validation of OCR tests (#138)
Nikos Livathinos
2024-10-11 10:21:19 +02:00 -
5f1bd9e9c8
docs: simplify LlamaIndex example using Docling extension (#135)
Panos Vagenas
2024-10-09 22:17:56 +02:00 -
6924999f1f
chore: explicitly manage pandas dependency (#134)
Panos Vagenas
2024-10-09 14:50:39 +02:00 -
0ffc1708d2
chore: bump version to 1.19.0 [skip ci]
v1.19.0
github-actions[bot]
2024-10-08 17:42:29 +00:00 -
f96ea86a00
feat: add options for choosing OCR engines (#118)
Michele Dolfi
2024-10-08 19:07:08 +02:00 -
d412c363d7
fixed unload pdf backend resources (#129)
Fasal Shah
2024-10-08 14:16:43 +05:30 -
86ead45aa1
align with isort
extend-metadata-in-examples
Panos Vagenas
2024-10-04 15:25:52 +02:00 -
86fd560cfd
minor notebook updates
Panos Vagenas
2024-10-04 14:50:38 +02:00 -
6e16a2464e
add docling splitter to LC example, simplify & align QA output
Panos Vagenas
2024-10-04 14:43:27 +02:00 -
f4ee76eaec
chore: showcase extended metadata in LlamaIndex example
Panos Vagenas
2024-09-27 19:31:43 +02:00 -
9b82ae3324
chore: bump version to 1.18.0 [skip ci]
v1.18.0
github-actions[bot]
2024-10-03 17:16:00 +00:00 -
2422f706a1
feat: new torch-based docling models (#120)
Maxim Lysak
2024-10-03 18:42:33 +02:00 -
9ebbbc1245
chore: bump version to 1.17.0 [skip ci]
v1.17.0
github-actions[bot]
2024-10-03 13:44:52 +00:00 -
dde0aff8bd
update examples (#123)
Rui Dias Gomes
2024-10-03 13:28:25 +01:00 -
d44c62d7ce
feat: windows support (#122)
Michele Dolfi
2024-10-03 14:23:47 +02:00 -
bfdc4e32cc
chore: Add test data with scanned documents and their conversions usinga EasyOCR
nli/tesseract_ocr_models
Nikos Livathinos
2024-10-02 13:35:38 +02:00 -
c211808742
feat: tesseract and tesserocr models. WIP.
Nikos Livathinos
2024-10-02 13:30:27 +02:00 -
455d6ff70f
chore: Add tesserocr in poetry
Nikos Livathinos
2024-10-02 13:27:34 +02:00 -
bbfc0617f2
feat: add options for choosing OCR engine
Michele Dolfi
2024-10-02 10:47:20 +02:00 -
cde671cf34
chore: bump version to 1.16.1 [skip ci]
v1.16.1
github-actions[bot]
2024-09-27 14:36:40 +00:00 -
34bd887a7f
fix: allow usage of opencv 4.6.x (#110)
Michele Dolfi
2024-09-27 15:51:43 +02:00 -
c05b692d69
docs: document chunking (#111)
Panos Vagenas
2024-09-27 11:16:04 +02:00 -
6760571fe1
chore: bump version to 1.16.0 [skip ci]
v1.16.0
github-actions[bot]
2024-09-27 06:21:15 +00:00 -
d6df76f90b
feat: Support tableformer model choice (#90)
Christoph Auer
2024-09-26 21:37:08 +02:00 -
39977b5631
chore: move examples extras to respective group (#103)
Panos Vagenas
2024-09-25 15:47:48 +02:00 -
3dfd02a7e9
chore: bump version to 1.15.0 [skip ci]
v1.15.0
github-actions[bot]
2024-09-24 15:58:16 +00:00 -
6a03c208ec
feat: add figure in markdown (#98)
Michele Dolfi
2024-09-24 17:28:23 +02:00 -
001d214a13
chore: bump version to 1.14.0 [skip ci]
v1.14.0
github-actions[bot]
2024-09-24 13:38:23 +00:00 -
d96b96c848
fix: fix OCR setting for pypdfium, minor refactor (#102)
Panos Vagenas
2024-09-24 14:36:00 +02:00 -
f8f2303348
docs: document CLI, minor README revamp (#100)
Panos Vagenas
2024-09-24 09:21:28 +02:00 -
f555815343
chore: add RAG notebook titles (#101)
Panos Vagenas
2024-09-24 09:17:46 +02:00 -
3c46e4266c
feat: add URL support to CLI (#99)
Panos Vagenas
2024-09-24 08:47:53 +02:00 -
c65a01c9b7
chore: bump version to 1.13.1 [skip ci]
v1.13.1
github-actions[bot]
2024-09-23 19:04:01 +00:00 -
4794ce460a
fix: updated the render_as_doctags with the new arguments from docling-core (#93)
Peter W. J. Staar
2024-09-23 20:12:18 +02:00 -
dce9934a0f
Updated to new, clean vector logo, svg and rendered png are provided (#96)
Maxim Lysak
2024-09-23 15:31:21 +02:00 -
1f4b224ab6
chore: switch to gh apps user (#92)
Michele Dolfi
2024-09-20 17:02:27 +02:00 -
6dd1e91c4a
chore: bump version to 1.13.0 [skip ci]
v1.13.0
github-actions[bot]
2024-09-18 09:26:03 +00:00 -
0da7519896
docs: updated Docling logo.png with transparent background (#88)
Maxim Lysak
2024-09-18 10:39:11 +02:00 -
f19bd43798
feat: add table exports (#86)
Michele Dolfi
2024-09-18 08:44:13 +02:00 -
442443a102
fix: bumped the glm version and adjusted the tests (#83)
Peter W. J. Staar
2024-09-18 07:43:49 +02:00 -
8242bce4fa
chore: bump version to 1.12.2 [skip ci]
v1.12.2
github-actions[bot]
2024-09-17 16:01:34 +00:00 -
fa9699fa3c
fix(tests): Adjust the test data to match the new version of LayoutPredictor (#82)
Nikos Livathinos
2024-09-17 15:50:35 +02:00 -
30a0ef69b4
chore: Add PR template (#81)
Michele Dolfi
2024-09-16 18:36:26 +02:00 -
f1932fd8c5
chore: bump version to 1.12.1 [skip ci]
v1.12.1
github-actions[bot]
2024-09-16 10:58:09 +00:00 -
2870fdc857
fix: CLI compatibility with python 3.10 and 3.11 (#79)
Michele Dolfi
2024-09-16 12:32:45 +02:00 -
34b2772a2e
chore: bump version to 1.12.0 [skip ci]
v1.12.0
github-actions[bot]
2024-09-13 12:34:15 +00:00 -
98990784df
feat: add docling cli (#75)
Peter W. J. Staar
2024-09-13 14:03:09 +02:00 -
8aa476ccd3
test: improve typing definitions (part 1) (#72)
Michele Dolfi
2024-09-12 15:56:29 +02:00 -
4090f9700b
add node parser, JSONPath resolution to LI example, refactor
demo
Panos Vagenas
2024-09-12 09:20:48 +02:00 -
d8ddb559fa
docs: add conversion example
Panos Vagenas
2024-09-12 06:39:10 +02:00 -
53569a1023
docs: showcase RAG with LlamaIndex and LangChain (#71)
Panos Vagenas
2024-09-11 15:07:08 +02:00