AI on demand: opendatalab/MinerU2.5-2509-1.2B: Difference between revisions
Jump to navigation
Jump to search
No edit summary |
|||
| (8 intermediate revisions by the same user not shown) | |||
| Line 1: | Line 1: | ||
== Calling the model == | |||
<syntaxhighlight lang="bash"> | |||
# Set your personal key: | |||
STONEY_KEY=sk-... | |||
# Set the desired model: | |||
MODEL=MinerU2.5-2509-1.2B | |||
# Set the desired document to run OCR against: | |||
FILE_PATH=document.png | |||
# Encode document contents with Base64 and detect MIME type: | |||
FILE_CONTENT_BASE64=$(base64 -w 0 < "$FILE_PATH") | |||
FILE_MIME_TYPE=$(file --brief --mime-type "$FILE_PATH") | |||
curl https://llm.stoney-cloud.com/v1/chat/completions \ | |||
--silent --fail --show-error \ | |||
--header "Authorization: Bearer $STONEY_KEY" \ | |||
--header 'Content-Type: application/json' \ | |||
--data '{ | |||
"model": "'"$MODEL"'", | |||
"messages": [{ | |||
"role": "user", | |||
"content": [{ | |||
"type": "image_url", | |||
"image_url": { | |||
"url": "data:'"$FILE_MIME_TYPE"';base64,'"$FILE_CONTENT_BASE64"'" | |||
} | |||
}] | |||
}], | |||
"max_tokens": 4096, | |||
"temperature": 0.2, | |||
"top_p": 0.9 | |||
}' \ | |||
| jq | |||
</syntaxhighlight> | |||
Example output: | |||
<syntaxhighlight lang="json"> | |||
{ | |||
"id": "chatcmpl-928cc308fa758fc8", | |||
"object": "chat.completion", | |||
"created": 1778491655, | |||
"model": "MinerU2.5-2509-1.2B", | |||
"choices": [ | |||
{ | |||
"index": 0, | |||
"message": { | |||
"role": "assistant", | |||
"content": "This is a lot of 12 point text to test theOCR code and see if it works on all types of file format. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox.", | |||
"refusal": null, | |||
"annotations": null, | |||
"audio": null, | |||
"function_call": null, | |||
"tool_calls": [], | |||
"reasoning": null, | |||
"reasoning_content": null | |||
}, | |||
"logprobs": null, | |||
"finish_reason": "stop", | |||
"stop_reason": null, | |||
"token_ids": null | |||
} | |||
], | |||
"service_tier": null, | |||
"system_fingerprint": null, | |||
"usage": { | |||
"prompt_tokens": 412, | |||
"total_tokens": 480, | |||
"completion_tokens": 68, | |||
"prompt_tokens_details": null | |||
}, | |||
"prompt_logprobs": null, | |||
"prompt_token_ids": null, | |||
"kv_transfer_params": null | |||
} | |||
</syntaxhighlight> | </syntaxhighlight> | ||
[[Category:AI on demand]] | [[Category:AI on demand]] | ||
Latest revision as of 11:28, 11 May 2026
Calling the model
# Run OCR on a single document image through the chat-completions endpoint
# and pretty-print the JSON response with jq.

# Set your personal key:
STONEY_KEY=sk-...
# Set the desired model:
MODEL=MinerU2.5-2509-1.2B
# Set the desired document to run OCR against:
FILE_PATH=document.png

# Encode document contents with Base64 and detect MIME type.
# "-w 0" disables line wrapping (GNU coreutils option) so the encoded data is
# a single line that can be embedded in a JSON string.
FILE_CONTENT_BASE64=$(base64 -w 0 < "$FILE_PATH")
FILE_MIME_TYPE=$(file --brief --mime-type "$FILE_PATH")

# The request body is fed to curl on standard input (--data-binary @-) through
# a here-document instead of being passed as a command-line argument. The
# kernel limits the size of a single argument (128 KiB on Linux), so inlining
# the Base64-encoded document in --data '...' fails with
# "Argument list too long" for anything but small images.
# The document is sent as a data: URL inside an "image_url" content part.
curl https://llm.stoney-cloud.com/v1/chat/completions \
  --silent --fail --show-error \
  --header "Authorization: Bearer $STONEY_KEY" \
  --header 'Content-Type: application/json' \
  --data-binary @- <<EOF | jq .
{
  "model": "$MODEL",
  "messages": [{
    "role": "user",
    "content": [{
      "type": "image_url",
      "image_url": {
        "url": "data:$FILE_MIME_TYPE;base64,$FILE_CONTENT_BASE64"
      }
    }]
  }],
  "max_tokens": 4096,
  "temperature": 0.2,
  "top_p": 0.9
}
EOF
Example output:
{
"id": "chatcmpl-928cc308fa758fc8",
"object": "chat.completion",
"created": 1778491655,
"model": "MinerU2.5-2509-1.2B",
"choices": [
{
"index": 0,
"message": {
"role": "assistant",
"content": "This is a lot of 12 point text to test theOCR code and see if it works on all types of file format. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox. The quick brown dog jumped over the lazy fox.",
"refusal": null,
"annotations": null,
"audio": null,
"function_call": null,
"tool_calls": [],
"reasoning": null,
"reasoning_content": null
},
"logprobs": null,
"finish_reason": "stop",
"stop_reason": null,
"token_ids": null
}
],
"service_tier": null,
"system_fingerprint": null,
"usage": {
"prompt_tokens": 412,
"total_tokens": 480,
"completion_tokens": 68,
"prompt_tokens_details": null
},
"prompt_logprobs": null,
"prompt_token_ids": null,
"kv_transfer_params": null
}