POST /v4/model-templates
import SGPClient from 'sgp';

// Shared API client used by the example below. The key is taken from the
// SGP_API_KEY environment variable; this is the default, so the option can be omitted.
const client = new SGPClient({ apiKey: process.env.SGP_API_KEY });

/**
 * Creates a model template through the SGP client and logs the id of the
 * object returned by the create call.
 *
 * @returns {Promise<void>} Settles after the create call has completed and the id was logged.
 */
async function main() {
  // Placeholder image/registry/tag values for the bundle configuration.
  const bundleConfig = { image: 'image', registry: 'registry', tag: 'tag' };

  const templateParams = {
    account_id: 'account_id',
    endpoint_type: 'SYNC',
    model_type: 'COMPLETION',
    name: 'name',
    vendor_configuration: { bundle_config: bundleConfig },
  };

  const createdTemplate = await client.modelTemplates.create(templateParams);
  console.log(createdTemplate.id);
}

// Run the example. A failed request is reported and the process is marked as
// failed instead of leaving the promise returned by main() unhandled.
main().catch((err) => {
  console.error(err);
  process.exitCode = 1;
});
{
  "name": "<string>",
  "endpoint_type": "SYNC",
  "model_type": "COMPLETION",
  "vendor_configuration": {
    "vendor": "LAUNCH",
    "bundle_config": {
      "registry": "<string>",
      "image": "<string>",
      "tag": "<string>",
      "command": [
        "<string>"
      ],
      "env": {},
      "streaming_command": [
        "<string>"
      ],
      "readiness_initial_delay_seconds": 120,
      "healthcheck_route": "/readyz",
      "predict_route": "/predict",
      "streaming_predict_route": "/generate_streaming"
    },
    "endpoint_config": {
      "cpus": 3,
      "memory": "8Gi",
      "storage": "16Gi",
      "gpus": 0,
      "gpu_type": "nvidia-tesla-t4",
      "min_workers": 0,
      "max_workers": 1,
      "per_worker": 10,
      "endpoint_type": "ASYNC",
      "high_priority": false
    },
    "fine_tuning_job_bundle_config": {
      "registry": "<string>",
      "image": "<string>",
      "tag": "<string>",
      "command": [
        "<string>"
      ],
      "env": {},
      "mount_location": "/workspace/launch_specific/config.json",
      "training_dataset_schema_type": "GENERATION",
      "resources": {
        "cpus": 3,
        "memory": "8Gi",
        "storage": "16Gi",
        "gpus": 0,
        "gpu_type": "nvidia-tesla-t4"
      }
    }
  },
  "model_creation_parameters_schema": {
    "parameters": [
      {
        "name": "<string>",
        "type": "str",
        "description": "<string>",
        "required": true
      }
    ]
  },
  "model_request_parameters_schema": {
    "parameters": [
      {
        "name": "<string>",
        "type": "str",
        "description": "<string>",
        "required": true
      }
    ]
  },
  "endpoint_protocol": "SGP",
  "id": "<string>",
  "created_at": "2023-11-07T05:31:56Z",
  "account_id": "<string>",
  "created_by_user_id": "<string>"
}

Authorizations

x-api-key
string
header
required

Headers

x-selected-account-id
string

Body

application/json

Response

200
application/json

Successful Response

The response is of type object.