From f5528623a77d9a3b0d821035f66baefd49da8dd9 Mon Sep 17 00:00:00 2001 From: Cesar Berrospi Ramis <75900930+ceberam@users.noreply.github.com> Date: Mon, 17 Nov 2025 12:48:41 +0100 Subject: [PATCH] docs(examples): remove deprecation warnings with export_to_dataframe (#2638) fix: remove deprecation warnings with export_to_dataframe Signed-off-by: Cesar Berrospi Ramis --- docs/examples/export_tables.py | 2 +- docs/v2.md | 5 ++++- tests/verify_utils.py | 3 --- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/docs/examples/export_tables.py b/docs/examples/export_tables.py index 8d02d45f..a673ea9d 100644 --- a/docs/examples/export_tables.py +++ b/docs/examples/export_tables.py @@ -52,7 +52,7 @@ def main(): # Export tables for table_ix, table in enumerate(conv_res.document.tables): - table_df: pd.DataFrame = table.export_to_dataframe() + table_df: pd.DataFrame = table.export_to_dataframe(doc=conv_res.document) print(f"## Table {table_ix}") print(table_df.to_markdown()) diff --git a/docs/v2.md b/docs/v2.md index 395555d9..257b35f5 100644 --- a/docs/v2.md +++ b/docs/v2.md @@ -146,6 +146,9 @@ is now available in conversion results as a `DoclingDocument` object. `DoclingDocument` provides a neat set of APIs to construct, iterate and export content in the document, as shown below. ```python +import pandas as pd +from docling_core.types.doc import TextItem, TableItem + conv_result: ConversionResult = doc_converter.convert("https://arxiv.org/pdf/2408.09869") # previously `convert_single` ## Inspect the converted document: @@ -156,7 +159,7 @@ for item, level in conv_result.document.iterate_items(): if isinstance(item, TextItem): print(item.text) elif isinstance(item, TableItem): - table_df: pd.DataFrame = item.export_to_dataframe() + table_df: pd.DataFrame = item.export_to_dataframe(doc=conv_result.document) print(table_df.to_markdown()) elif ...: #... diff --git a/tests/verify_utils.py b/tests/verify_utils.py index ad02ca3a..c76b8ed4 100644 --- a/tests/verify_utils.py +++ b/tests/verify_utils.py @@ -171,9 +171,6 @@ def verify_table_v2(true_item: TableItem, pred_item: TableItem, fuzzy: bool): assert true_item.data is not None, "documents are expected to have table data" assert pred_item.data is not None, "documents are expected to have table data" - # print("True: \n", true_item.export_to_dataframe().to_markdown()) - # print("Pred: \n", true_item.export_to_dataframe().to_markdown()) - for i, row in enumerate(true_item.data.grid): for j, col in enumerate(true_item.data.grid[i]): # print("true: ", true_item.data[i][j].text)