mirror of
https://github.com/DS4SD/docling.git
synced 2025-07-26 03:55:00 +00:00
fix: Disable TOKENIZERS_PARALLELISM in test_e2e_ocr_conversion.py to avoid warning messages from the Hugging Face (HF) tokenizers
Signed-off-by: Nikos Livathinos <nli@zurich.ibm.com>
This commit is contained in:
parent
75db61127c
commit
dadff50589
@ -1,3 +1,4 @@
|
||||
import os
|
||||
import sys
|
||||
from pathlib import Path
|
||||
from typing import List
|
||||
@ -53,6 +54,12 @@ def get_converter(ocr_options: OcrOptions):
|
||||
|
||||
|
||||
def test_e2e_conversions():
|
||||
r"""
|
||||
End-to-end conversions with OCR
|
||||
"""
|
||||
# Disable parallelisation for HF tokenizers to avoid warning messages
|
||||
os.environ["TOKENIZERS_PARALLELISM"] = "false"
|
||||
|
||||
pdf_paths = get_pdf_paths()
|
||||
|
||||
engines: List[OcrOptions] = [
|
||||
|
Loading…
Reference in New Issue
Block a user