AI on demand: allenai/olmOCR-2-7B

From MediaWiki
Revision as of 10:18, 28 May 2026 by Sst-yde (talk | contribs) (→‎Calling the model)
(diff) ← Older revision | Latest revision (diff) | Newer revision → (diff)
Jump to navigation Jump to search

Calling the model

The sample image used as OCR input in the example below.
# Send a local image to the OCR model through the chat completions endpoint
# and pretty-print the JSON response.
#
# The request body is assembled by jq and streamed to curl over stdin:
#   * every value is JSON-escaped by jq instead of being spliced into a
#     hand-written JSON string by the shell;
#   * the Base64 payload never becomes a command-line argument. A single
#     argument is size-limited by the kernel (typically 128 KiB on Linux), so
#     passing the payload via --data '...' fails with "Argument list too long"
#     for anything but small images.

# Set your personal key:
STONEY_KEY=sk-...

# Set the desired model:
MODEL=allenai/olmOCR-2-7B

# Set the desired document to run OCR against:
FILE_PATH=document.png

# Detect the MIME type used in the data URL:
FILE_MIME_TYPE=$(file --brief --mime-type "$FILE_PATH")

# Pipeline stages:
#   1. base64   - encode the document contents (plain invocation; the GNU-only
#                 "-w 0" flag is avoided for portability)
#   2. tr       - strip the line wrapping that base64 adds by default
#   3. jq       - read the whole encoded payload as one string (.) and build
#                 the compact JSON request body around it
#   4. curl     - POST the body read from stdin (--data-binary keeps it as-is)
#   5. jq .     - pretty-print the response
base64 < "$FILE_PATH" \
        | tr -d '\r\n' \
        | jq --raw-input --slurp --compact-output \
                --arg model "$MODEL" \
                --arg mime "$FILE_MIME_TYPE" \
                '{
                        model: $model,
                        messages: [{
                                role: "user",
                                content: [{
                                        type: "image_url",
                                        image_url: {
                                                url: ("data:" + $mime + ";base64," + .)
                                        }
                                }]
                        }],
                        max_tokens: 4096,
                        temperature: 0.2,
                        top_p: 0.9
                }' \
        | curl https://llm.stoney-cloud.com/v1/chat/completions \
                --silent --fail --show-error \
                --header "Authorization: Bearer $STONEY_KEY" \
                --header 'Content-Type: application/json' \
                --data-binary @- \
        | jq .

Example output:

{
  "id": "chatcmpl-b96a0fa8d921c5ed",
  "object": "chat.completion",
  "created": 1779956243,
  "model": "allenai/olmOCR-2-7B",
  "choices": [
    {
      "index": 0,
      "message": {
        "role": "assistant",
        "content": "This is a lot of 12 point text to test the ocr code and see if it works on all types of file format.\nThe quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox.",
        "refusal": null,
        "annotations": null,
        "audio": null,
        "function_call": null,
        "tool_calls": [],
        "reasoning": null
      },
      "logprobs": null,
      "finish_reason": "stop",
      "stop_reason": null,
      "token_ids": null
    }
  ],
  "service_tier": null,
  "system_fingerprint": null,
  "usage": {
    "prompt_tokens": 412,
    "total_tokens": 481,
    "completion_tokens": 69,
    "prompt_tokens_details": null
  },
  "prompt_logprobs": null,
  "prompt_token_ids": null,
  "kv_transfer_params": null
}