diff --git a/tests/data/groundtruth/docling_v2/inline_and_formatting.md.md b/tests/data/groundtruth/docling_v2/inline_and_formatting.md.md index f8f71a37..625f1292 100644 --- a/tests/data/groundtruth/docling_v2/inline_and_formatting.md.md +++ b/tests/data/groundtruth/docling_v2/inline_and_formatting.md.md @@ -12,7 +12,7 @@ Create your feature branch: `git checkout -b feature/AmazingFeature` . 4. Push to the branch ( `git push origin feature/AmazingFeature` ) 5. Open a Pull Request -## +## *Second* section @@ -21,4 +21,4 @@ Create your feature branch: `git checkout -b feature/AmazingFeature` . | Bold Heading | Italic Heading | |----------------|------------------| -| data a | data b | \ No newline at end of file +| data a | data b | diff --git a/tests/data/groundtruth/docling_v2/inline_and_formatting.md.yaml b/tests/data/groundtruth/docling_v2/inline_and_formatting.md.yaml index 4ef8e189..9591eed7 100644 --- a/tests/data/groundtruth/docling_v2/inline_and_formatting.md.yaml +++ b/tests/data/groundtruth/docling_v2/inline_and_formatting.md.yaml @@ -150,7 +150,8 @@ pages: {} pictures: [] schema_name: DoclingDocument tables: -- captions: [] +- annotations: [] + captions: [] children: [] content_layer: body data: @@ -285,6 +286,7 @@ tables: prov: [] references: [] self_ref: '#/tables/0' + word_items_ids: [] texts: - children: [] content_layer: body @@ -295,6 +297,7 @@ texts: prov: [] self_ref: '#/texts/0' text: Contribution guideline example + word_items_ids: [] - children: [] content_layer: body label: text @@ -304,6 +307,7 @@ texts: prov: [] self_ref: '#/texts/1' text: This is simple. + word_items_ids: [] - children: [] content_layer: body label: text @@ -313,11 +317,13 @@ texts: prov: [] self_ref: '#/texts/2' text: Foo + word_items_ids: [] - children: [] content_layer: body formatting: bold: false italic: true + script: baseline strikethrough: false underline: false label: text @@ -327,11 +333,13 @@ texts: prov: [] self_ref: '#/texts/3' text: emphasis + word_items_ids: [] - children: [] content_layer: body formatting: bold: true italic: false + script: baseline strikethrough: false underline: false label: text @@ -341,11 +349,13 @@ texts: prov: [] self_ref: '#/texts/4' text: strong emphasis + word_items_ids: [] - children: [] content_layer: body formatting: bold: true italic: true + script: baseline strikethrough: false underline: false label: text @@ -355,6 +365,7 @@ texts: prov: [] self_ref: '#/texts/5' text: both + word_items_ids: [] - children: [] content_layer: body label: text @@ -364,6 +375,7 @@ texts: prov: [] self_ref: '#/texts/6' text: . + word_items_ids: [] - children: [] content_layer: body label: text @@ -373,6 +385,7 @@ texts: prov: [] self_ref: '#/texts/7' text: 'Create your feature branch:' + word_items_ids: [] - captions: [] children: [] code_language: unknown @@ -386,6 +399,7 @@ texts: references: [] self_ref: '#/texts/8' text: git checkout -b feature/AmazingFeature + word_items_ids: [] - children: [] content_layer: body label: text @@ -395,6 +409,7 @@ texts: prov: [] self_ref: '#/texts/9' text: . + word_items_ids: [] - children: - $ref: '#/groups/3' content_layer: body @@ -407,6 +422,7 @@ texts: prov: [] self_ref: '#/texts/10' text: '' + word_items_ids: [] - children: [] content_layer: body label: text @@ -416,11 +432,13 @@ texts: prov: [] self_ref: '#/texts/11' text: Pull the + word_items_ids: [] - children: [] content_layer: body formatting: bold: true italic: false + script: baseline strikethrough: false underline: false hyperlink: https://github.com/docling-project/docling @@ -431,6 +449,7 @@ texts: prov: [] self_ref: '#/texts/12' text: repository + word_items_ids: [] - children: [] content_layer: body label: text @@ -440,6 +459,7 @@ texts: prov: [] self_ref: '#/texts/13' text: . + word_items_ids: [] - children: - $ref: '#/groups/4' content_layer: body @@ -452,6 +472,7 @@ texts: prov: [] self_ref: '#/texts/14' text: '' + word_items_ids: [] - children: [] content_layer: body label: text @@ -461,6 +482,7 @@ texts: prov: [] self_ref: '#/texts/15' text: Create your feature branch ( + word_items_ids: [] - captions: [] children: [] code_language: unknown @@ -474,6 +496,7 @@ texts: references: [] self_ref: '#/texts/16' text: git checkout -b feature/AmazingFeature + word_items_ids: [] - children: [] content_layer: body label: text @@ -483,6 +506,7 @@ texts: prov: [] self_ref: '#/texts/17' text: ) + word_items_ids: [] - children: - $ref: '#/groups/5' content_layer: body @@ -495,6 +519,7 @@ texts: prov: [] self_ref: '#/texts/18' text: '' + word_items_ids: [] - children: [] content_layer: body label: text @@ -504,6 +529,7 @@ texts: prov: [] self_ref: '#/texts/19' text: Commit your changes ( + word_items_ids: [] - captions: [] children: [] code_language: unknown @@ -517,6 +543,7 @@ texts: references: [] self_ref: '#/texts/20' text: git commit -m 'Add some AmazingFeature' + word_items_ids: [] - children: [] content_layer: body label: text @@ -526,6 +553,7 @@ texts: prov: [] self_ref: '#/texts/21' text: ) + word_items_ids: [] - children: - $ref: '#/groups/6' content_layer: body @@ -538,6 +566,7 @@ texts: prov: [] self_ref: '#/texts/22' text: '' + word_items_ids: [] - children: [] content_layer: body label: text @@ -547,6 +576,7 @@ texts: prov: [] self_ref: '#/texts/23' text: Push to the branch ( + word_items_ids: [] - captions: [] children: [] code_language: unknown @@ -560,6 +590,7 @@ texts: references: [] self_ref: '#/texts/24' text: git push origin feature/AmazingFeature + word_items_ids: [] - children: [] content_layer: body label: text @@ -569,6 +600,7 @@ texts: prov: [] self_ref: '#/texts/25' text: ) + word_items_ids: [] - children: [] content_layer: body enumerated: true @@ -580,6 +612,7 @@ texts: prov: [] self_ref: '#/texts/26' text: Open a Pull Request + word_items_ids: [] - children: - $ref: '#/groups/7' content_layer: body @@ -591,11 +624,13 @@ texts: prov: [] self_ref: '#/texts/27' text: '' + word_items_ids: [] - children: [] content_layer: body formatting: bold: false italic: true + script: baseline strikethrough: false underline: false label: text @@ -605,6 +640,7 @@ texts: prov: [] self_ref: '#/texts/28' text: Second + word_items_ids: [] - children: [] content_layer: body label: text @@ -614,6 +650,7 @@ texts: prov: [] self_ref: '#/texts/29' text: section + word_items_ids: [] - children: - $ref: '#/groups/9' content_layer: body @@ -626,11 +663,13 @@ texts: prov: [] self_ref: '#/texts/30' text: '' + word_items_ids: [] - children: [] content_layer: body formatting: bold: true italic: false + script: baseline strikethrough: false underline: false label: text @@ -640,6 +679,7 @@ texts: prov: [] self_ref: '#/texts/31' text: First + word_items_ids: [] - children: [] content_layer: body label: text @@ -649,6 +689,7 @@ texts: prov: [] self_ref: '#/texts/32' text: ': Lorem ipsum.' + word_items_ids: [] - children: - $ref: '#/groups/10' content_layer: body @@ -661,11 +702,13 @@ texts: prov: [] self_ref: '#/texts/33' text: '' + word_items_ids: [] - children: [] content_layer: body formatting: bold: true italic: false + script: baseline strikethrough: false underline: false label: text @@ -675,6 +718,7 @@ texts: prov: [] self_ref: '#/texts/34' text: Second + word_items_ids: [] - children: [] content_layer: body label: text @@ -684,6 +728,7 @@ texts: prov: [] self_ref: '#/texts/35' text: ': Dolor' + word_items_ids: [] - captions: [] children: [] code_language: unknown @@ -697,6 +742,7 @@ texts: references: [] self_ref: '#/texts/36' text: sit + word_items_ids: [] - children: [] content_layer: body label: text @@ -706,4 +752,5 @@ texts: prov: [] self_ref: '#/texts/37' text: amet. -version: 1.3.0 \ No newline at end of file + word_items_ids: [] +version: 1.4.0