fix(pypdfium): resolve overlapping text when merging bounding boxes (#1549)

Get `merged_text` from the bounding box instead of merging the text itself, to prevent overlaps.

Signed-off-by: Pedro Ribeiro <pedro_ribeiro_93@hotmail.com>
This commit is contained in:
Pedro Ribeiro
2025-05-19 14:26:00 +01:00
committed by GitHub
parent 12a0e64892
commit 98b5eeb844
52 changed files with 52225 additions and 4690 deletions

View File

@@ -951,7 +951,7 @@
"page_no": 1,
"bbox": {
"l": 320.4467468261719,
-"t": 352.359375,
+"t": 352.3592834472656,
"r": 558.8576049804688,
"b": 81.689208984375,
"coord_origin": "BOTTOMLEFT"