# POST a JSON inference request to https://api.egp.scale.com/v5/inference.
#
# The request carries two headers (a JSON content type and an x-api-key
# credential) and a JSON body with three top-level fields: "model", "args",
# and "inference_configuration" (holding "timeout_seconds" and "num_retries").
#
# NOTE(review): '<api-key>', '<string>' and the 123 values look like template
# placeholders to be substituted before running -- confirm against the API docs.
curl -X POST 'https://api.egp.scale.com/v5/inference' \
  -H 'Content-Type: application/json' \
  -H 'x-api-key: <api-key>' \
  -d '{
"model": "<string>",
"args": {},
"inference_configuration": {
"timeout_seconds": 123,
"num_retries": 123
}
}'