Create Evaluation

curl --request POST \
  --url https://api.egp.scale.com/v5/evaluations \
  --header 'Content-Type: application/json' \
  --header 'x-api-key: <api-key>' \
  --data '
{
  "name": "<string>",
  "data": [
    {}
  ],
  "description": "<string>",
  "tags": [
    "<string>"
  ],
  "tasks": [
    {
      "configuration": {
        "model": "<string>",
        "messages": [
          {}
        ],
        "top_k": 123,
        "frequency_penalty": 123,
        "function_call": {},
        "functions": [
          {}
        ],
        "logit_bias": {},
        "logprobs": true,
        "max_completion_tokens": 123,
        "max_tokens": 123,
        "metadata": {},
        "modalities": [
          "<string>"
        ],
        "n": 123,
        "parallel_tool_calls": true,
        "prediction": {},
        "presence_penalty": 123,
        "reasoning_effort": "<string>",
        "response_format": {},
        "seed": 123,
        "stop": "<string>",
        "store": true,
        "temperature": 123,
        "tool_choice": "<string>",
        "tools": [
          {}
        ],
        "top_logprobs": 123,
        "top_p": 123,
        "audio": {}
      },
      "task_type": "chat_completion",
      "alias": "chat_completion"
    }
  ],
  "metadata": {},
  "files": [
    {}
  ]
}
'

{
  "id": "<string>",
  "name": "<string>",
  "created_at": "2023-11-07T05:31:56Z",
  "created_by": {
    "id": "<string>",
    "type": "user",
    "object": "identity"
  },
  "tags": [
    "<string>"
  ],
  "datasets": [
    {
      "id": "<string>",
      "created_by": {
        "id": "<string>",
        "type": "user",
        "object": "identity"
      },
      "name": "<string>",
      "created_at": "2023-11-07T05:31:56Z",
      "tags": [
        "<string>"
      ],
      "current_version_num": 123,
      "object": "dataset",
      "description": "<string>",
      "archived_at": "2023-11-07T05:31:56Z"
    }
  ],
  "status": "failed",
  "object": "evaluation",
  "description": "<string>",
  "archived_at": "2023-11-07T05:31:56Z",
  "status_reason": "<string>",
  "progress": {
    "workflows": {
      "total": 123,
      "completed": 123,
      "failed": 123,
      "pending": 123
    },
    "items": {
      "total": 123,
      "successful": 123,
      "failed": 123,
      "pending": 123,
      "failed_items": []
    }
  },
  "tasks": [
    {
      "configuration": {
        "model": "<string>",
        "messages": [
          {}
        ],
        "top_k": 123,
        "frequency_penalty": 123,
        "function_call": {},
        "functions": [
          {}
        ],
        "logit_bias": {},
        "logprobs": true,
        "max_completion_tokens": 123,
        "max_tokens": 123,
        "metadata": {},
        "modalities": [
          "<string>"
        ],
        "n": 123,
        "parallel_tool_calls": true,
        "prediction": {},
        "presence_penalty": 123,
        "reasoning_effort": "<string>",
        "response_format": {},
        "seed": 123,
        "stop": "<string>",
        "store": true,
        "temperature": 123,
        "tool_choice": "<string>",
        "tools": [
          {}
        ],
        "top_logprobs": 123,
        "top_p": 123,
        "audio": {}
      },
      "task_type": "chat_completion",
      "alias": "chat_completion"
    }
  ],
  "metadata": {}
}

POST /v5/evaluations

Create Evaluation

curl --request POST \
  --url https://api.egp.scale.com/v5/evaluations \
  --header 'Content-Type: application/json' \
  --header 'x-api-key: <api-key>' \
  --data '
{
  "name": "<string>",
  "data": [
    {}
  ],
  "description": "<string>",
  "tags": [
    "<string>"
  ],
  "tasks": [
    {
      "configuration": {
        "model": "<string>",
        "messages": [
          {}
        ],
        "top_k": 123,
        "frequency_penalty": 123,
        "function_call": {},
        "functions": [
          {}
        ],
        "logit_bias": {},
        "logprobs": true,
        "max_completion_tokens": 123,
        "max_tokens": 123,
        "metadata": {},
        "modalities": [
          "<string>"
        ],
        "n": 123,
        "parallel_tool_calls": true,
        "prediction": {},
        "presence_penalty": 123,
        "reasoning_effort": "<string>",
        "response_format": {},
        "seed": 123,
        "stop": "<string>",
        "store": true,
        "temperature": 123,
        "tool_choice": "<string>",
        "tools": [
          {}
        ],
        "top_logprobs": 123,
        "top_p": 123,
        "audio": {}
      },
      "task_type": "chat_completion",
      "alias": "chat_completion"
    }
  ],
  "metadata": {},
  "files": [
    {}
  ]
}
'

{
  "id": "<string>",
  "name": "<string>",
  "created_at": "2023-11-07T05:31:56Z",
  "created_by": {
    "id": "<string>",
    "type": "user",
    "object": "identity"
  },
  "tags": [
    "<string>"
  ],
  "datasets": [
    {
      "id": "<string>",
      "created_by": {
        "id": "<string>",
        "type": "user",
        "object": "identity"
      },
      "name": "<string>",
      "created_at": "2023-11-07T05:31:56Z",
      "tags": [
        "<string>"
      ],
      "current_version_num": 123,
      "object": "dataset",
      "description": "<string>",
      "archived_at": "2023-11-07T05:31:56Z"
    }
  ],
  "status": "failed",
  "object": "evaluation",
  "description": "<string>",
  "archived_at": "2023-11-07T05:31:56Z",
  "status_reason": "<string>",
  "progress": {
    "workflows": {
      "total": 123,
      "completed": 123,
      "failed": 123,
      "pending": 123
    },
    "items": {
      "total": 123,
      "successful": 123,
      "failed": 123,
      "pending": 123,
      "failed_items": []
    }
  },
  "tasks": [
    {
      "configuration": {
        "model": "<string>",
        "messages": [
          {}
        ],
        "top_k": 123,
        "frequency_penalty": 123,
        "function_call": {},
        "functions": [
          {}
        ],
        "logit_bias": {},
        "logprobs": true,
        "max_completion_tokens": 123,
        "max_tokens": 123,
        "metadata": {},
        "modalities": [
          "<string>"
        ],
        "n": 123,
        "parallel_tool_calls": true,
        "prediction": {},
        "presence_penalty": 123,
        "reasoning_effort": "<string>",
        "response_format": {},
        "seed": 123,
        "stop": "<string>",
        "store": true,
        "temperature": 123,
        "tool_choice": "<string>",
        "tools": [
          {}
        ],
        "top_logprobs": 123,
        "top_p": 123,
        "audio": {}
      },
      "task_type": "chat_completion",
      "alias": "chat_completion"
    }
  ],
  "metadata": {}
}

Authorizations

x-api-key

string

header

required

Headers

x-selected-account-id

string | null

Body

application/json

EvaluationStandaloneCreateRequest
EvaluationFromDatasetCreateRequest
EvaluationWithDatasetCreateRequest

name

string

required

data

Data · object[]

required

Items to be evaluated

Minimum array length: 1

description

string

Response

Successful Response

id

string

required

name

string

required

created_at

string<date-time>

required

created_by

Identity · object

required

The identity that created the entity.

Show child attributes

Inference

Questions

Files

Models

Datasets

Dataset Items

Evaluations

Evaluation Groups

Evaluation Charts

Evaluation Items

Spans

Span Assessment

Credentials

Create Evaluation

Authorizations

Headers

Body

Response