import SGPClient from 'sgp';
const client = new SGPClient({
apiKey: 'My API Key',
});
// Automatically fetches more pages as needed.
for await (const modelDeployment of client.models.deployments.listAll()) {
console.log(modelDeployment.id);
}
{
"items": [
{
"name": "<string>",
"id": "<string>",
"created_at": "2023-11-07T05:31:56Z",
"account_id": "<string>",
"created_by_user_id": "<string>",
"created_by_identity_type": "user",
"status": "<string>",
"model_creation_parameters": {},
"model_endpoint_id": "<string>",
"model_instance_id": "<string>",
"vendor_configuration": {
"min_workers": 0,
"max_workers": 1,
"per_worker": 10,
"vendor": "LAUNCH"
},
"deployment_metadata": {}
}
],
"total_item_count": 123,
"current_page": 123,
"items_per_page": 123
}
TODO: Document
import SGPClient from 'sgp';
const client = new SGPClient({
apiKey: 'My API Key',
});
// Automatically fetches more pages as needed.
for await (const modelDeployment of client.models.deployments.listAll()) {
console.log(modelDeployment.id);
}
{
"items": [
{
"name": "<string>",
"id": "<string>",
"created_at": "2023-11-07T05:31:56Z",
"account_id": "<string>",
"created_by_user_id": "<string>",
"created_by_identity_type": "user",
"status": "<string>",
"model_creation_parameters": {},
"model_endpoint_id": "<string>",
"model_instance_id": "<string>",
"vendor_configuration": {
"min_workers": 0,
"max_workers": 1,
"per_worker": 10,
"vendor": "LAUNCH"
},
"deployment_metadata": {}
}
],
"total_item_count": 123,
"current_page": 123,
"items_per_page": 123
}
model_creation_parameters:asc, model_creation_parameters:desc, model_endpoint_id:asc, model_endpoint_id:desc, model_instance_id:asc, model_instance_id:desc, vendor_configuration:asc, vendor_configuration:desc, deployment_metadata:asc, deployment_metadata:desc, status:asc, status:desc, id:asc, id:desc, created_at:asc, created_at:desc, account_id:asc, account_id:desc, created_by_user_id:asc, created_by_user_id:desc, created_by_identity_type:asc, created_by_identity_type:desc, name:asc, name:desc
Optional filter by account id
Page number for pagination to be returned by the given endpoint. Starts at page 1
x >= 1
Maximum number of artifacts to be returned by the given endpoint. Defaults to 100 and cannot be greater than 10k.
1 <= x <= 10000
Successful Response
The data returned for the current page.
Show child attributes
The unique identifier of the entity.
The date and time when the entity was created in ISO format.
The ID of the account that owns the given entity.
The user who originally created the entity.
The type of identity that created the entity.
user, service_account
Status of the model's deployment.
Show child attributes
The maximum number of concurrent requests that an individual worker can
service. Launch automatically scales the number of workers for the endpoint so that
each worker is processing per_worker requests, subject to the limits defined by
min_workers and max_workers.
- If the average number of concurrent requests per worker is lower than
per_worker, then the number of workers will be reduced.
- Otherwise, if the average number of concurrent requests per worker is higher than
per_worker, then the number of workers will be increased to meet the elevated
traffic.
Here is our recommendation for computing per_worker:
1. Compute min_workers and max_workers per your minimum and maximum
throughput requirements.
2. Determine a value for the maximum number of
concurrent requests in the workload. Divide this number by max_workers. Doing
this ensures that the number of workers will "climb" to max_workers.
"LAUNCH"
The total number of items of the query
The current page number.
The number of items per page.