mirror of
https://github.com/DS4SD/docling.git
synced 2025-12-10 13:48:13 +00:00
More elegant solution in removing the input prompt
Signed-off-by: Maksym Lysak <mly@zurich.ibm.com>
This commit is contained in:
@@ -117,17 +117,12 @@ class SmolDoclingModel(BasePageModel):
|
|||||||
)
|
)
|
||||||
|
|
||||||
generation_time = time.time() - start_time
|
generation_time = time.time() - start_time
|
||||||
|
|
||||||
generated_texts = self.processor.batch_decode(
|
generated_texts = self.processor.batch_decode(
|
||||||
generated_ids, skip_special_tokens=False
|
generated_ids[:, inputs["input_ids"].shape[1] :],
|
||||||
|
skip_special_tokens=False,
|
||||||
)[0]
|
)[0]
|
||||||
|
|
||||||
num_tokens = len(generated_ids[0])
|
num_tokens = len(generated_ids[0])
|
||||||
# DELETE NOISE BEFORE "Assistant: "
|
|
||||||
starting_point = "Assistant: "
|
|
||||||
generated_texts = generated_texts[
|
|
||||||
generated_texts.index(starting_point) + len(starting_point) :
|
|
||||||
]
|
|
||||||
# generated_texts = generated_texts.replace("Assistant: ", "")
|
|
||||||
page_tags = generated_texts
|
page_tags = generated_texts
|
||||||
|
|
||||||
inference_time = time.time() - start_time
|
inference_time = time.time() - start_time
|
||||||
|
|||||||
Reference in New Issue
Block a user