Mirror of https://github.com/DS4SD/docling.git (synced 2025-12-08 12:48:28 +00:00)
Add VLM task interpreters
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
This commit is contained in:
@@ -366,8 +366,6 @@ class VlmProcessingStage(ThreadedPipelineStage):
 one output item (success, empty, or failed). Non-cluster payloads are ignored.
 """
 
-print("VLM stage: ", self.task_name)
-
 groups: dict[int, list[ThreadedItem]] = defaultdict(list)
 for itm in batch:
 if (
@@ -456,8 +454,6 @@ class VlmProcessingStage(ThreadedPipelineStage):
 # 3. Interpret predictions back into page/cluster structures
 predictions_list: List[VlmPrediction] = list(vlm_predictions)
 
-print("Predictions: ", predictions_list)
-
 for i, (item, prediction) in enumerate(zip(item_mapping, predictions_list)):
 assert item.payload is not None
 assert isinstance(item.payload, ClusterItem)
Reference in New Issue
Block a user