Files
docling/tests/data/groundtruth/docling_v2/webvtt_example_01.vtt.json
Panos Vagenas 55908d6bb4 chore: pretest docling-core 2.51.0
Signed-off-by: Panos Vagenas <pva@zurich.ibm.com>
2025-11-12 16:35:49 +01:00

1074 lines
22 KiB
JSON
Vendored
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
{
"schema_name": "DoclingDocument",
"version": "1.8.0",
"name": "webvtt_example_01",
"origin": {
"mimetype": "text/vtt",
"binary_hash": 16887312431371817791,
"filename": "webvtt_example_01.vtt"
},
"furniture": {
"self_ref": "#/furniture",
"children": [],
"content_layer": "furniture",
"name": "_root_",
"label": "unspecified"
},
"body": {
"self_ref": "#/body",
"children": [
{
"$ref": "#/groups/0"
},
{
"$ref": "#/groups/2"
},
{
"$ref": "#/groups/4"
},
{
"$ref": "#/groups/6"
},
{
"$ref": "#/groups/8"
},
{
"$ref": "#/groups/10"
},
{
"$ref": "#/groups/12"
},
{
"$ref": "#/groups/14"
},
{
"$ref": "#/groups/16"
},
{
"$ref": "#/groups/18"
},
{
"$ref": "#/groups/20"
},
{
"$ref": "#/groups/22"
},
{
"$ref": "#/groups/24"
}
],
"content_layer": "body",
"name": "_root_",
"label": "unspecified"
},
"groups": [
{
"self_ref": "#/groups/0",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/0"
},
{
"$ref": "#/groups/1"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/1",
"parent": {
"$ref": "#/groups/0"
},
"children": [
{
"$ref": "#/texts/1"
},
{
"$ref": "#/texts/2"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/2",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/3"
},
{
"$ref": "#/groups/3"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/3",
"parent": {
"$ref": "#/groups/2"
},
"children": [
{
"$ref": "#/texts/4"
},
{
"$ref": "#/texts/5"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/4",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/6"
},
{
"$ref": "#/groups/5"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/5",
"parent": {
"$ref": "#/groups/4"
},
"children": [
{
"$ref": "#/texts/7"
},
{
"$ref": "#/texts/8"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/6",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/9"
},
{
"$ref": "#/groups/7"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/7",
"parent": {
"$ref": "#/groups/6"
},
"children": [
{
"$ref": "#/texts/10"
},
{
"$ref": "#/texts/11"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/8",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/12"
},
{
"$ref": "#/groups/9"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/9",
"parent": {
"$ref": "#/groups/8"
},
"children": [
{
"$ref": "#/texts/13"
},
{
"$ref": "#/texts/14"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/10",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/15"
},
{
"$ref": "#/groups/11"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/11",
"parent": {
"$ref": "#/groups/10"
},
"children": [
{
"$ref": "#/texts/16"
},
{
"$ref": "#/texts/17"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/12",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/18"
},
{
"$ref": "#/groups/13"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/13",
"parent": {
"$ref": "#/groups/12"
},
"children": [
{
"$ref": "#/texts/19"
},
{
"$ref": "#/texts/20"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/14",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/21"
},
{
"$ref": "#/groups/15"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/15",
"parent": {
"$ref": "#/groups/14"
},
"children": [
{
"$ref": "#/texts/22"
},
{
"$ref": "#/texts/23"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/16",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/24"
},
{
"$ref": "#/groups/17"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/17",
"parent": {
"$ref": "#/groups/16"
},
"children": [
{
"$ref": "#/texts/25"
},
{
"$ref": "#/texts/26"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/18",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/27"
},
{
"$ref": "#/groups/19"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/19",
"parent": {
"$ref": "#/groups/18"
},
"children": [
{
"$ref": "#/texts/28"
},
{
"$ref": "#/texts/29"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/20",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/30"
},
{
"$ref": "#/groups/21"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/21",
"parent": {
"$ref": "#/groups/20"
},
"children": [
{
"$ref": "#/texts/31"
},
{
"$ref": "#/texts/32"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/22",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/33"
},
{
"$ref": "#/groups/23"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/23",
"parent": {
"$ref": "#/groups/22"
},
"children": [
{
"$ref": "#/texts/34"
},
{
"$ref": "#/texts/35"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
},
{
"self_ref": "#/groups/24",
"parent": {
"$ref": "#/body"
},
"children": [
{
"$ref": "#/texts/36"
},
{
"$ref": "#/groups/25"
}
],
"content_layer": "body",
"name": "WebVTT cue block",
"label": "section"
},
{
"self_ref": "#/groups/25",
"parent": {
"$ref": "#/groups/24"
},
"children": [
{
"$ref": "#/texts/37"
},
{
"$ref": "#/texts/38"
}
],
"content_layer": "body",
"name": "WebVTT cue voice span",
"label": "inline"
}
],
"texts": [
{
"self_ref": "#/texts/0",
"parent": {
"$ref": "#/groups/0"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:11.000 --> 00:13.000",
"text": "00:11.000 --> 00:13.000"
},
{
"self_ref": "#/texts/1",
"parent": {
"$ref": "#/groups/1"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/2",
"parent": {
"$ref": "#/groups/1"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "We are in New York City",
"text": "We are in New York City",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/3",
"parent": {
"$ref": "#/groups/2"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:13.000 --> 00:16.000",
"text": "00:13.000 --> 00:16.000"
},
{
"self_ref": "#/texts/4",
"parent": {
"$ref": "#/groups/3"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/5",
"parent": {
"$ref": "#/groups/3"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Were actually at the Lucern Hotel, just down the street",
"text": "Were actually at the Lucern Hotel, just down the street",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/6",
"parent": {
"$ref": "#/groups/4"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:16.000 --> 00:18.000",
"text": "00:16.000 --> 00:18.000"
},
{
"self_ref": "#/texts/7",
"parent": {
"$ref": "#/groups/5"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/8",
"parent": {
"$ref": "#/groups/5"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "from the American Museum of Natural History",
"text": "from the American Museum of Natural History",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/9",
"parent": {
"$ref": "#/groups/6"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:18.000 --> 00:20.000",
"text": "00:18.000 --> 00:20.000"
},
{
"self_ref": "#/texts/10",
"parent": {
"$ref": "#/groups/7"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/11",
"parent": {
"$ref": "#/groups/7"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "And with me is Neil deGrasse Tyson",
"text": "And with me is Neil deGrasse Tyson",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/12",
"parent": {
"$ref": "#/groups/8"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:20.000 --> 00:22.000",
"text": "00:20.000 --> 00:22.000"
},
{
"self_ref": "#/texts/13",
"parent": {
"$ref": "#/groups/9"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/14",
"parent": {
"$ref": "#/groups/9"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Astrophysicist, Director of the Hayden Planetarium",
"text": "Astrophysicist, Director of the Hayden Planetarium",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/15",
"parent": {
"$ref": "#/groups/10"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:22.000 --> 00:24.000",
"text": "00:22.000 --> 00:24.000"
},
{
"self_ref": "#/texts/16",
"parent": {
"$ref": "#/groups/11"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/17",
"parent": {
"$ref": "#/groups/11"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "at the AMNH.",
"text": "at the AMNH.",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/18",
"parent": {
"$ref": "#/groups/12"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:24.000 --> 00:26.000",
"text": "00:24.000 --> 00:26.000"
},
{
"self_ref": "#/texts/19",
"parent": {
"$ref": "#/groups/13"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/20",
"parent": {
"$ref": "#/groups/13"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Thank you for walking down here.",
"text": "Thank you for walking down here.",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/21",
"parent": {
"$ref": "#/groups/14"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:27.000 --> 00:30.000",
"text": "00:27.000 --> 00:30.000"
},
{
"self_ref": "#/texts/22",
"parent": {
"$ref": "#/groups/15"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/23",
"parent": {
"$ref": "#/groups/15"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "And I want to do a follow-up on the last conversation we did.",
"text": "And I want to do a follow-up on the last conversation we did.",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/24",
"parent": {
"$ref": "#/groups/16"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:30.000 --> 00:31.500",
"text": "00:30.000 --> 00:31.500"
},
{
"self_ref": "#/texts/25",
"parent": {
"$ref": "#/groups/17"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/26",
"parent": {
"$ref": "#/groups/17"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "When we e-mailed—",
"text": "When we e-mailed—",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/27",
"parent": {
"$ref": "#/groups/18"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:30.500 --> 00:32.500",
"text": "00:30.500 --> 00:32.500"
},
{
"self_ref": "#/texts/28",
"parent": {
"$ref": "#/groups/19"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Neil deGrasse Tyson: ",
"text": "Neil deGrasse Tyson: "
},
{
"self_ref": "#/texts/29",
"parent": {
"$ref": "#/groups/19"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Didnt we talk about enough in that conversation?",
"text": "Didnt we talk about enough in that conversation?",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/30",
"parent": {
"$ref": "#/groups/20"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:32.000 --> 00:35.500",
"text": "00:32.000 --> 00:35.500"
},
{
"self_ref": "#/texts/31",
"parent": {
"$ref": "#/groups/21"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/32",
"parent": {
"$ref": "#/groups/21"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "No! No no no no; 'cos 'cos obviously 'cos",
"text": "No! No no no no; 'cos 'cos obviously 'cos",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/33",
"parent": {
"$ref": "#/groups/22"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:32.500 --> 00:33.500",
"text": "00:32.500 --> 00:33.500"
},
{
"self_ref": "#/texts/34",
"parent": {
"$ref": "#/groups/23"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Neil deGrasse Tyson: ",
"text": "Neil deGrasse Tyson: "
},
{
"self_ref": "#/texts/35",
"parent": {
"$ref": "#/groups/23"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Laughs",
"text": "Laughs",
"formatting": {
"bold": false,
"italic": true,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
},
{
"self_ref": "#/texts/36",
"parent": {
"$ref": "#/groups/24"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "00:35.500 --> 00:38.000",
"text": "00:35.500 --> 00:38.000"
},
{
"self_ref": "#/texts/37",
"parent": {
"$ref": "#/groups/25"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "Roger Bingham: ",
"text": "Roger Bingham: "
},
{
"self_ref": "#/texts/38",
"parent": {
"$ref": "#/groups/25"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [],
"orig": "You know Im so excited my glasses are falling off here.",
"text": "You know Im so excited my glasses are falling off here.",
"formatting": {
"bold": false,
"italic": false,
"underline": false,
"strikethrough": false,
"script": "baseline"
}
}
],
"pictures": [],
"tables": [],
"key_value_items": [],
"form_items": [],
"pages": {}
}