From 31056d10e440238de22d045f62ce781169221223 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?V=C3=A1clav=20Van=C4=8Dura?= Date: Wed, 5 Feb 2025 10:50:08 +0100 Subject: [PATCH] Actor: Fixing example PDF document URLs MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: Václav Vančura --- .actor/README.md | 8 ++++---- .actor/input_schema.json | 2 +- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/.actor/README.md b/.actor/README.md index d899e0d4..a51c4d11 100644 --- a/.actor/README.md +++ b/.actor/README.md @@ -54,7 +54,7 @@ curl --request POST \ --header 'Content-Type: application/json' \ --header 'Authorization: Bearer YOUR_API_TOKEN' \ --data '{ - "documentUrl": "https://example.com/document.pdf", + "documentUrl": "https://arxiv.org/pdf/2408.09869.pdf", "outputFormat": "md", "ocr": true }' @@ -63,8 +63,8 @@ curl --request POST \ ### Using Apify CLI ```bash -apify call username/actorname --input='{ - "documentUrl": "https://example.com/file.pdf", +$ apify call username/actorname --input='{ + "documentUrl": "https://arxiv.org/pdf/2408.09869.pdf", "outputFormat": "md", "ocr": true }' @@ -84,7 +84,7 @@ The Actor accepts a JSON schema matching the file `.actor/input_schema.json`. Be ```json { - "documentUrl": "https://some-website.com/document.pdf", + "documentUrl": "https://arxiv.org/pdf/2408.09869.pdf", "outputFormat": "md", "ocr": false } diff --git a/.actor/input_schema.json b/.actor/input_schema.json index 9c7c4031..f58ef1f1 100644 --- a/.actor/input_schema.json +++ b/.actor/input_schema.json @@ -8,7 +8,7 @@ "title": "Document URL", "type": "string", "description": "URL of the document to process with Docling. Supported formats: images, 'pdf', 'docx', 'pptx', 'xlsx, 'html', 'md', 'xml_pubmed', 'asciidoc', 'xml_uspto'.", - "prefill": "https://vancura.dev/assets/actor-test/facial-hairstyles-and-filtering-facepiece-respirators.pdf", + "prefill": "https://arxiv.org/pdf/2408.09869.pdf", "editor": "textfield" }, "outputFormat": {