mirror of
https://github.com/DS4SD/docling.git
synced 2025-08-02 15:32:30 +00:00
updated the cli to export html
Signed-off-by: Peter Staar <taa@zurich.ibm.com>
This commit is contained in:
parent
9f5e512080
commit
a062ab1937
@ -87,6 +87,7 @@ def export_documents(
|
|||||||
conv_results: Iterable[ConversionResult],
|
conv_results: Iterable[ConversionResult],
|
||||||
output_dir: Path,
|
output_dir: Path,
|
||||||
export_json: bool,
|
export_json: bool,
|
||||||
|
export_html: bool,
|
||||||
export_md: bool,
|
export_md: bool,
|
||||||
export_txt: bool,
|
export_txt: bool,
|
||||||
export_doctags: bool,
|
export_doctags: bool,
|
||||||
@ -100,13 +101,20 @@ def export_documents(
|
|||||||
success_count += 1
|
success_count += 1
|
||||||
doc_filename = conv_res.input.file.stem
|
doc_filename = conv_res.input.file.stem
|
||||||
|
|
||||||
# Export Deep Search document JSON format:
|
# Export JSON format:
|
||||||
if export_json:
|
if export_json:
|
||||||
fname = output_dir / f"{doc_filename}.json"
|
fname = output_dir / f"{doc_filename}.json"
|
||||||
with fname.open("w", encoding="utf8") as fp:
|
with fname.open("w", encoding="utf8") as fp:
|
||||||
_log.info(f"writing JSON output to {fname}")
|
_log.info(f"writing JSON output to {fname}")
|
||||||
fp.write(json.dumps(conv_res.document.export_to_dict()))
|
fp.write(json.dumps(conv_res.document.export_to_dict()))
|
||||||
|
|
||||||
|
# Export HTML format:
|
||||||
|
if export_html:
|
||||||
|
fname = output_dir / f"{doc_filename}.html"
|
||||||
|
with fname.open("w", encoding="utf8") as fp:
|
||||||
|
_log.info(f"writing HTML output to {fname}")
|
||||||
|
fp.write(conv_res.document.export_to_html())
|
||||||
|
|
||||||
# Export Text format:
|
# Export Text format:
|
||||||
if export_txt:
|
if export_txt:
|
||||||
fname = output_dir / f"{doc_filename}.txt"
|
fname = output_dir / f"{doc_filename}.txt"
|
||||||
@ -299,6 +307,7 @@ def convert(
|
|||||||
to_formats = [OutputFormat.MARKDOWN]
|
to_formats = [OutputFormat.MARKDOWN]
|
||||||
|
|
||||||
export_json = OutputFormat.JSON in to_formats
|
export_json = OutputFormat.JSON in to_formats
|
||||||
|
export_html = OutputFormat.HTML in to_formats
|
||||||
export_md = OutputFormat.MARKDOWN in to_formats
|
export_md = OutputFormat.MARKDOWN in to_formats
|
||||||
export_txt = OutputFormat.TEXT in to_formats
|
export_txt = OutputFormat.TEXT in to_formats
|
||||||
export_doctags = OutputFormat.DOCTAGS in to_formats
|
export_doctags = OutputFormat.DOCTAGS in to_formats
|
||||||
@ -364,6 +373,7 @@ def convert(
|
|||||||
conv_results,
|
conv_results,
|
||||||
output_dir=output,
|
output_dir=output,
|
||||||
export_json=export_json,
|
export_json=export_json,
|
||||||
|
export_html=export_html,
|
||||||
export_md=export_md,
|
export_md=export_md,
|
||||||
export_txt=export_txt,
|
export_txt=export_txt,
|
||||||
export_doctags=export_doctags,
|
export_doctags=export_doctags,
|
||||||
|
Loading…
Reference in New Issue
Block a user