mirror of
https://github.com/DS4SD/docling.git
synced 2025-08-02 15:32:30 +00:00
chore: remove type-ignore marks for attaching text to non-GroupItems
After commit b74208 of docling-core, text items can be attached to any NodeItem, so the `# type: ignore[arg-type]` marks are no longer needed and can be removed.
Signed-off-by: Cesar Berrospi Ramis <75900930+ceberam@users.noreply.github.com>
This commit is contained in:
parent
e9768ae6a5
commit
82168f946c
@ -389,7 +389,7 @@ class PatentUsptoIce(PatentUspto):
|
|||||||
if name == self.Element.TITLE.value:
|
if name == self.Element.TITLE.value:
|
||||||
if text:
|
if text:
|
||||||
self.parents[self.level + 1] = self.doc.add_title(
|
self.parents[self.level + 1] = self.doc.add_title(
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
text=text,
|
text=text,
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
@ -406,7 +406,7 @@ class PatentUsptoIce(PatentUspto):
|
|||||||
abstract_item = self.doc.add_heading(
|
abstract_item = self.doc.add_heading(
|
||||||
heading_text,
|
heading_text,
|
||||||
level=heading_level,
|
level=heading_level,
|
||||||
parent=self.parents[heading_level], # type: ignore[arg-type]
|
parent=self.parents[heading_level],
|
||||||
)
|
)
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
@ -434,7 +434,7 @@ class PatentUsptoIce(PatentUspto):
|
|||||||
claims_item = self.doc.add_heading(
|
claims_item = self.doc.add_heading(
|
||||||
heading_text,
|
heading_text,
|
||||||
level=heading_level,
|
level=heading_level,
|
||||||
parent=self.parents[heading_level], # type: ignore[arg-type]
|
parent=self.parents[heading_level],
|
||||||
)
|
)
|
||||||
for text in self.claims:
|
for text in self.claims:
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
@ -452,7 +452,7 @@ class PatentUsptoIce(PatentUspto):
|
|||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text=text,
|
text=text,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.text = ""
|
self.text = ""
|
||||||
|
|
||||||
@ -460,7 +460,7 @@ class PatentUsptoIce(PatentUspto):
|
|||||||
self.parents[self.level + 1] = self.doc.add_heading(
|
self.parents[self.level + 1] = self.doc.add_heading(
|
||||||
text=text,
|
text=text,
|
||||||
level=self.level,
|
level=self.level,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
self.text = ""
|
self.text = ""
|
||||||
@ -470,7 +470,7 @@ class PatentUsptoIce(PatentUspto):
|
|||||||
empty_table = TableData(num_rows=0, num_cols=0, table_cells=[])
|
empty_table = TableData(num_rows=0, num_cols=0, table_cells=[])
|
||||||
self.doc.add_table(
|
self.doc.add_table(
|
||||||
data=empty_table,
|
data=empty_table,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
def _apply_style(self, text: str, style_tag: str) -> str:
|
def _apply_style(self, text: str, style_tag: str) -> str:
|
||||||
@ -721,7 +721,7 @@ class PatentUsptoGrantV2(PatentUspto):
|
|||||||
if self.Element.TITLE.value in self.property and text.strip():
|
if self.Element.TITLE.value in self.property and text.strip():
|
||||||
title = text.strip()
|
title = text.strip()
|
||||||
self.parents[self.level + 1] = self.doc.add_title(
|
self.parents[self.level + 1] = self.doc.add_title(
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
text=title,
|
text=title,
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
@ -749,7 +749,7 @@ class PatentUsptoGrantV2(PatentUspto):
|
|||||||
self.parents[self.level + 1] = self.doc.add_heading(
|
self.parents[self.level + 1] = self.doc.add_heading(
|
||||||
text=text.strip(),
|
text=text.strip(),
|
||||||
level=self.level,
|
level=self.level,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
|
|
||||||
@ -769,7 +769,7 @@ class PatentUsptoGrantV2(PatentUspto):
|
|||||||
claims_item = self.doc.add_heading(
|
claims_item = self.doc.add_heading(
|
||||||
heading_text,
|
heading_text,
|
||||||
level=heading_level,
|
level=heading_level,
|
||||||
parent=self.parents[heading_level], # type: ignore[arg-type]
|
parent=self.parents[heading_level],
|
||||||
)
|
)
|
||||||
for text in self.claims:
|
for text in self.claims:
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
@ -787,7 +787,7 @@ class PatentUsptoGrantV2(PatentUspto):
|
|||||||
abstract_item = self.doc.add_heading(
|
abstract_item = self.doc.add_heading(
|
||||||
heading_text,
|
heading_text,
|
||||||
level=heading_level,
|
level=heading_level,
|
||||||
parent=self.parents[heading_level], # type: ignore[arg-type]
|
parent=self.parents[heading_level],
|
||||||
)
|
)
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH, text=abstract, parent=abstract_item
|
label=DocItemLabel.PARAGRAPH, text=abstract, parent=abstract_item
|
||||||
@ -799,7 +799,7 @@ class PatentUsptoGrantV2(PatentUspto):
|
|||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text=paragraph,
|
text=paragraph,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
elif self.Element.CLAIM.value in self.property:
|
elif self.Element.CLAIM.value in self.property:
|
||||||
# we may need a space after a paragraph in claim text
|
# we may need a space after a paragraph in claim text
|
||||||
@ -811,7 +811,7 @@ class PatentUsptoGrantV2(PatentUspto):
|
|||||||
empty_table = TableData(num_rows=0, num_cols=0, table_cells=[])
|
empty_table = TableData(num_rows=0, num_cols=0, table_cells=[])
|
||||||
self.doc.add_table(
|
self.doc.add_table(
|
||||||
data=empty_table,
|
data=empty_table,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
def _apply_style(self, text: str, style_tag: str) -> str:
|
def _apply_style(self, text: str, style_tag: str) -> str:
|
||||||
@ -938,7 +938,7 @@ class PatentUsptoGrantAps(PatentUspto):
|
|||||||
self.parents[self.level + 1] = self.doc.add_heading(
|
self.parents[self.level + 1] = self.doc.add_heading(
|
||||||
heading.value,
|
heading.value,
|
||||||
level=self.level,
|
level=self.level,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
|
|
||||||
@ -959,7 +959,7 @@ class PatentUsptoGrantAps(PatentUspto):
|
|||||||
|
|
||||||
if field == self.Field.TITLE.value:
|
if field == self.Field.TITLE.value:
|
||||||
self.parents[self.level + 1] = self.doc.add_title(
|
self.parents[self.level + 1] = self.doc.add_title(
|
||||||
parent=self.parents[self.level], text=value # type: ignore[arg-type]
|
parent=self.parents[self.level], text=value
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
|
|
||||||
@ -971,14 +971,14 @@ class PatentUsptoGrantAps(PatentUspto):
|
|||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text=value,
|
text=value,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
elif field == self.Field.NUMBER.value and section == self.Section.CLAIMS.value:
|
elif field == self.Field.NUMBER.value and section == self.Section.CLAIMS.value:
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text="",
|
text="",
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
elif (
|
elif (
|
||||||
@ -996,7 +996,7 @@ class PatentUsptoGrantAps(PatentUspto):
|
|||||||
last_claim = self.doc.add_text(
|
last_claim = self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text="",
|
text="",
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
last_claim.text += f" {value}" if last_claim.text else value
|
last_claim.text += f" {value}" if last_claim.text else value
|
||||||
@ -1012,7 +1012,7 @@ class PatentUsptoGrantAps(PatentUspto):
|
|||||||
self.parents[self.level + 1] = self.doc.add_heading(
|
self.parents[self.level + 1] = self.doc.add_heading(
|
||||||
value,
|
value,
|
||||||
level=self.level,
|
level=self.level,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
|
|
||||||
@ -1029,7 +1029,7 @@ class PatentUsptoGrantAps(PatentUspto):
|
|||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text=value,
|
text=value,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
def parse(self, patent_content: str) -> Optional[DoclingDocument]:
|
def parse(self, patent_content: str) -> Optional[DoclingDocument]:
|
||||||
@ -1283,7 +1283,7 @@ class PatentUsptoAppV1(PatentUspto):
|
|||||||
title = text.strip()
|
title = text.strip()
|
||||||
if title:
|
if title:
|
||||||
self.parents[self.level + 1] = self.doc.add_text(
|
self.parents[self.level + 1] = self.doc.add_text(
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
label=DocItemLabel.TITLE,
|
label=DocItemLabel.TITLE,
|
||||||
text=title,
|
text=title,
|
||||||
)
|
)
|
||||||
@ -1301,7 +1301,7 @@ class PatentUsptoAppV1(PatentUspto):
|
|||||||
abstract_item = self.doc.add_heading(
|
abstract_item = self.doc.add_heading(
|
||||||
heading_text,
|
heading_text,
|
||||||
level=heading_level,
|
level=heading_level,
|
||||||
parent=self.parents[heading_level], # type: ignore[arg-type]
|
parent=self.parents[heading_level],
|
||||||
)
|
)
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
@ -1331,7 +1331,7 @@ class PatentUsptoAppV1(PatentUspto):
|
|||||||
claims_item = self.doc.add_heading(
|
claims_item = self.doc.add_heading(
|
||||||
heading_text,
|
heading_text,
|
||||||
level=heading_level,
|
level=heading_level,
|
||||||
parent=self.parents[heading_level], # type: ignore[arg-type]
|
parent=self.parents[heading_level],
|
||||||
)
|
)
|
||||||
for text in self.claims:
|
for text in self.claims:
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
@ -1350,14 +1350,14 @@ class PatentUsptoAppV1(PatentUspto):
|
|||||||
self.parents[self.level + 1] = self.doc.add_heading(
|
self.parents[self.level + 1] = self.doc.add_heading(
|
||||||
text=text,
|
text=text,
|
||||||
level=self.level,
|
level=self.level,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.level += 1
|
self.level += 1
|
||||||
else:
|
else:
|
||||||
self.doc.add_text(
|
self.doc.add_text(
|
||||||
label=DocItemLabel.PARAGRAPH,
|
label=DocItemLabel.PARAGRAPH,
|
||||||
text=text,
|
text=text,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
self.text = ""
|
self.text = ""
|
||||||
|
|
||||||
@ -1366,7 +1366,7 @@ class PatentUsptoAppV1(PatentUspto):
|
|||||||
empty_table = TableData(num_rows=0, num_cols=0, table_cells=[])
|
empty_table = TableData(num_rows=0, num_cols=0, table_cells=[])
|
||||||
self.doc.add_table(
|
self.doc.add_table(
|
||||||
data=empty_table,
|
data=empty_table,
|
||||||
parent=self.parents[self.level], # type: ignore[arg-type]
|
parent=self.parents[self.level],
|
||||||
)
|
)
|
||||||
|
|
||||||
def _apply_style(self, text: str, style_tag: str) -> str:
|
def _apply_style(self, text: str, style_tag: str) -> str:
|
||||||
|
Loading…
Reference in New Issue
Block a user