mirror of
https://github.com/DS4SD/docling.git
synced 2025-07-27 04:24:45 +00:00
add example PNG
Signed-off-by: Michele Dolfi <dol@zurich.ibm.com>
This commit is contained in:
parent
a84ba6ddec
commit
3794f8245e
@ -25,6 +25,7 @@ input_paths = [
|
|||||||
Path("tests/data/lorem_ipsum.docx"),
|
Path("tests/data/lorem_ipsum.docx"),
|
||||||
Path("tests/data/powerpoint_sample.pptx"),
|
Path("tests/data/powerpoint_sample.pptx"),
|
||||||
Path("tests/data/2206.01062.pdf"),
|
Path("tests/data/2206.01062.pdf"),
|
||||||
|
# Path("tests/data/2305.03393v1-pg9-img.png"),
|
||||||
]
|
]
|
||||||
input = DocumentConversionInput.from_paths(input_paths)
|
input = DocumentConversionInput.from_paths(input_paths)
|
||||||
|
|
||||||
@ -35,6 +36,7 @@ input = DocumentConversionInput.from_paths(input_paths)
|
|||||||
doc_converter = DocumentConverter( # all of the below is optional, has internal defaults.
|
doc_converter = DocumentConverter( # all of the below is optional, has internal defaults.
|
||||||
formats=[
|
formats=[
|
||||||
InputFormat.PDF,
|
InputFormat.PDF,
|
||||||
|
# InputFormat.IMAGE,
|
||||||
InputFormat.DOCX,
|
InputFormat.DOCX,
|
||||||
], # whitelist formats, other files are ignored.
|
], # whitelist formats, other files are ignored.
|
||||||
format_options={
|
format_options={
|
||||||
|
BIN
tests/data/2305.03393v1-pg9-img.png
Normal file
BIN
tests/data/2305.03393v1-pg9-img.png
Normal file
Binary file not shown.
After Width: | Height: | Size: 301 KiB |
Loading…
Reference in New Issue
Block a user