Fix page_range stopping at page 32 by using dynamic batch_size

Co-authored-by: cau-git <60343111+cau-git@users.noreply.github.com>
This commit is contained in:
copilot-swe-agent[bot]
2025-11-19 13:25:00 +00:00
parent 18f705b235
commit 58fc6ccf86
2 changed files with 2 additions and 2 deletions

View File

@@ -252,7 +252,7 @@ class ThreadedLayoutVlmPipeline(BasePipeline):
proc = ProcessingResult(total_expected=total_pages)
fed_idx = 0
-batch_size = 32
+batch_size = total_pages
try:
while proc.success_count + proc.failure_count < total_pages:

View File

@@ -545,7 +545,7 @@ class StandardPdfPipeline(ConvertPipeline):
proc = ProcessingResult(total_expected=total_pages)
fed_idx: int = 0 # number of pages successfully queued
-batch_size: int = 32 # drain chunk
+batch_size: int = total_pages # drain chunk
try:
while proc.success_count + proc.failure_count < total_pages:
# 1) feed - try to enqueue until the first queue is full