mirror of
https://github.com/DS4SD/docling.git
synced 2025-07-30 14:04:27 +00:00
Actor: Fixed input getter
Signed-off-by: Adam Kliment <adam@netmilk.net>
This commit is contained in:
parent
1fe80d3c23
commit
7cd1f06868
@ -1,5 +1,7 @@
|
|||||||
#!/bin/bash
|
#!/bin/bash
|
||||||
|
|
||||||
|
export PATH=$PATH:/build-files/node_modules/.bin
|
||||||
|
|
||||||
# Function to upload content to the key-value store
|
# Function to upload content to the key-value store
|
||||||
upload_to_kvs() {
|
upload_to_kvs() {
|
||||||
local content_file="$1"
|
local content_file="$1"
|
||||||
@ -129,6 +131,10 @@ echo "Python version: $(python --version 2>&1)"
|
|||||||
echo "Docling-serve path: $(which docling-serve 2>/dev/null || echo 'Not found')"
|
echo "Docling-serve path: $(which docling-serve 2>/dev/null || echo 'Not found')"
|
||||||
echo "Working directory: $(pwd)"
|
echo "Working directory: $(pwd)"
|
||||||
|
|
||||||
|
# --- Get input ---
|
||||||
|
|
||||||
|
echo "Getting Apify ActorInput"
|
||||||
|
INPUT=$(apify actor get-input 2>/dev/null)
|
||||||
|
|
||||||
# --- Setup tools ---
|
# --- Setup tools ---
|
||||||
|
|
||||||
@ -283,49 +289,6 @@ DOCLING_API_ENDPOINT="http://localhost:5001/v1alpha/convert/source"
|
|||||||
echo "Starting document processing..."
|
echo "Starting document processing..."
|
||||||
echo "Reading input from Apify..."
|
echo "Reading input from Apify..."
|
||||||
|
|
||||||
# Function to handle Actor input detection
|
|
||||||
get_actor_input() {
|
|
||||||
local input=""
|
|
||||||
|
|
||||||
# Create directory if it doesn't exist
|
|
||||||
mkdir -p "/tmp/actor-input" || echo "Warning: Could not create /tmp/actor-input directory" >&2
|
|
||||||
|
|
||||||
# If /tmp/actor-input/INPUT exists as a directory, remove it
|
|
||||||
if [ -d "/tmp/actor-input/INPUT" ]; then
|
|
||||||
echo "Warning: /tmp/actor-input/INPUT exists as a directory. Removing it to create a file." >&2
|
|
||||||
rm -rf "/tmp/actor-input/INPUT"
|
|
||||||
fi
|
|
||||||
|
|
||||||
# Check multiple potential locations for input file
|
|
||||||
if [ -f "/tmp/actor-input/INPUT" ]; then
|
|
||||||
echo "Found standard Actor input file at /tmp/actor-input/INPUT" >&2
|
|
||||||
input=$(cat "/tmp/actor-input/INPUT")
|
|
||||||
elif [ -f "/input/INPUT" ]; then
|
|
||||||
echo "Found Actor input file at /input/INPUT" >&2
|
|
||||||
input=$(cat "/input/INPUT")
|
|
||||||
|
|
||||||
# Fallback to environment variable
|
|
||||||
elif [ -n "$APIFY_INPUT_JSON" ]; then
|
|
||||||
echo "Using APIFY_INPUT_JSON environment variable" >&2
|
|
||||||
input="$APIFY_INPUT_JSON"
|
|
||||||
|
|
||||||
# Last resort: use test input with md format
|
|
||||||
else
|
|
||||||
echo "No input found, using test input with md format" >&2
|
|
||||||
TEST_INPUT='{"documentUrl":"https://vancura.dev/assets/actor-test/facial-hairstyles-and-filtering-facepiece-respirators.pdf","ocr":true,"outputFormat":"md"}'
|
|
||||||
mkdir -p "/tmp/actor-input"
|
|
||||||
echo "$TEST_INPUT" > "/tmp/actor-input/INPUT"
|
|
||||||
|
|
||||||
# Read back the test input to ensure we get clean JSON
|
|
||||||
input=$(cat "/tmp/actor-input/INPUT")
|
|
||||||
fi
|
|
||||||
|
|
||||||
# Return only the JSON content
|
|
||||||
echo "$input"
|
|
||||||
}
|
|
||||||
|
|
||||||
# Get actor input
|
|
||||||
INPUT=$(get_actor_input)
|
|
||||||
echo "Input content:" >&2
|
echo "Input content:" >&2
|
||||||
echo "$INPUT" >&2 # Send the raw input to stderr for debugging
|
echo "$INPUT" >&2 # Send the raw input to stderr for debugging
|
||||||
echo "$INPUT" # Send the clean JSON to stdout for processing
|
echo "$INPUT" # Send the clean JSON to stdout for processing
|
||||||
|
Loading…
Reference in New Issue
Block a user