Download OpenAPI specification:
REST API server for evaluation backend orchestration
Create and execute an evaluation request using the simplified benchmark schema.
| name required | string The evaluation job name. |
| description | string The evaluation job description. |
| tags | Array of strings The evaluation job tags. |
| model required | object (ModelRef) The model to evaluate. |
| benchmarks required | Array of objects (EvaluationBenchmarkConfig) The evaluation benchmarks to run. |
| pass_criteria | object (PassCriteria) The overall pass criteria for the evaluation job. |
| experiment | object (ExperimentConfig) The MLFlow experiment configuration. When provided, the evaluation job will be tracked in MLFlow. |
| exports | object (EvaluationExports) Optional exports configuration for the evaluation job. When provided, the evaluation job results will be exported to the specified location. |
| custom | object Custom request data. This can be used for user-specific job data. |
{- "name": "string",
- "description": "string",
- "tags": [
- "string"
], - "model": {
- "url": "string",
- "name": "string",
- "parameters": { },
- "auth": {
- "secret_ref": "string"
}
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
], - "pass_criteria": {
- "threshold": 0
}, - "experiment": {
- "name": "string",
- "tags": [
- {
- "key": "string",
- "value": "string"
}
], - "artifact_location": "string"
}, - "exports": {
- "oci": {
- "coordinates": {
- "oci_host": "string",
- "oci_repository": "string",
- "oci_tag": "string",
- "oci_subject": "string",
- "annotations": {
- "property1": "string",
- "property2": "string"
}
}, - "k8s": {
- "connection": "string"
}
}
}, - "custom": { }
}
{- "name": "string",
- "description": "string",
- "tags": [
- "string"
], - "model": {
- "url": "string",
- "name": "string",
- "parameters": { },
- "auth": {
- "secret_ref": "string"
}
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
], - "pass_criteria": {
- "threshold": 0
}, - "experiment": {
- "name": "string",
- "tags": [
- {
- "key": "string",
- "value": "string"
}
], - "artifact_location": "string"
}, - "exports": {
- "oci": {
- "coordinates": {
- "oci_host": "string",
- "oci_repository": "string",
- "oci_tag": "string",
- "oci_subject": "string",
- "annotations": {
- "property1": "string",
- "property2": "string"
}
}, - "k8s": {
- "connection": "string"
}
}
}, - "custom": { },
- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string",
- "mlflow_experiment_id": "string"
}, - "status": {
- "state": "pending",
- "message": {
- "message": "string",
- "message_code": "string"
}, - "benchmarks": [
- {
- "provider_id": "string",
- "id": "string",
- "benchmark_index": 0,
- "status": "pending",
- "error_message": {
- "message": "string",
- "message_code": "string"
}, - "started_at": "2019-08-24T14:15:22Z",
- "completed_at": "2019-08-24T14:15:22Z"
}
]
}, - "results": {
- "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "benchmark_index": 0,
- "metrics": { },
- "artifacts": { },
- "mlflow_run_id": "string",
- "logs_path": "string",
- "test": {
- "primary_score": 0.1,
- "threshold": 0.1,
- "pass": true
}
}
], - "mlflow_experiment_url": "string",
- "test": {
- "score": 0.1,
- "threshold": 0.1,
- "pass": true
}
}
}
List all evaluation requests.
| limit | integer (Limit) [ 1 .. 100 ] Default: 50 Maximum number of evaluations to return |
| offset | integer (Offset) >= 0 Default: 0 Offset for pagination |
| status | string (Status Filter) Filter by status |
| name | string (Name) Name to search for |
| tags | string (Tags) Tags to search for |
{- "first": {
- "href": "string"
}, - "next": {
- "href": "string"
}, - "limit": 0,
- "total_count": 0,
- "items": [
- {
- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string",
- "mlflow_experiment_id": "string"
}, - "status": {
- "state": "pending",
- "message": {
- "message": "string",
- "message_code": "string"
}, - "benchmarks": [
- {
- "provider_id": "string",
- "id": "string",
- "benchmark_index": 0,
- "status": "pending",
- "error_message": {
- "message": "string",
- "message_code": "string"
}, - "started_at": "2019-08-24T14:15:22Z",
- "completed_at": "2019-08-24T14:15:22Z"
}
]
}, - "results": {
- "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "benchmark_index": 0,
- "metrics": { },
- "artifacts": { },
- "mlflow_run_id": "string",
- "logs_path": "string",
- "test": {
- "primary_score": 0.1,
- "threshold": 0.1,
- "pass": true
}
}
], - "mlflow_experiment_url": "string",
- "test": {
- "score": 0.1,
- "threshold": 0.1,
- "pass": true
}
}, - "name": "string",
- "description": "string",
- "tags": [
- "string"
], - "model": {
- "url": "string",
- "name": "string",
- "parameters": { },
- "auth": {
- "secret_ref": "string"
}
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
], - "pass_criteria": {
- "threshold": 0
}, - "experiment": {
- "name": "string",
- "tags": [
- {
- "key": "string",
- "value": "string"
}
], - "artifact_location": "string"
}, - "exports": {
- "oci": {
- "coordinates": {
- "oci_host": "string",
- "oci_repository": "string",
- "oci_tag": "string",
- "oci_subject": "string",
- "annotations": {
- "property1": "string",
- "property2": "string"
}
}, - "k8s": {
- "connection": "string"
}
}
}, - "custom": { }
}
], - "errors": [
- "string"
]
}
Returns the evaluation job resource with the current status and results.
| id required | string (Id) |
{- "name": "string",
- "description": "string",
- "tags": [
- "string"
], - "model": {
- "url": "string",
- "name": "string",
- "parameters": { },
- "auth": {
- "secret_ref": "string"
}
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
], - "pass_criteria": {
- "threshold": 0
}, - "experiment": {
- "name": "string",
- "tags": [
- {
- "key": "string",
- "value": "string"
}
], - "artifact_location": "string"
}, - "exports": {
- "oci": {
- "coordinates": {
- "oci_host": "string",
- "oci_repository": "string",
- "oci_tag": "string",
- "oci_subject": "string",
- "annotations": {
- "property1": "string",
- "property2": "string"
}
}, - "k8s": {
- "connection": "string"
}
}
}, - "custom": { },
- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string",
- "mlflow_experiment_id": "string"
}, - "status": {
- "state": "pending",
- "message": {
- "message": "string",
- "message_code": "string"
}, - "benchmarks": [
- {
- "provider_id": "string",
- "id": "string",
- "benchmark_index": 0,
- "status": "pending",
- "error_message": {
- "message": "string",
- "message_code": "string"
}, - "started_at": "2019-08-24T14:15:22Z",
- "completed_at": "2019-08-24T14:15:22Z"
}
]
}, - "results": {
- "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "benchmark_index": 0,
- "metrics": { },
- "artifacts": { },
- "mlflow_run_id": "string",
- "logs_path": "string",
- "test": {
- "primary_score": 0.1,
- "threshold": 0.1,
- "pass": true
}
}
], - "mlflow_experiment_url": "string",
- "test": {
- "score": 0.1,
- "threshold": 0.1,
- "pass": true
}
}
}
Cancel a running evaluation.
| id required | string (Id) |
| hard_delete | boolean (Hard Delete) Default: false If |
{- "message": "The field 'state' is not valid.",
- "message_code": "invalid_value",
- "trace": "b12692e1-8582-4628-88ca-7a13fefb73e2"
}
List all benchmark collections.
| limit | integer (Limit) [ 1 .. 100 ] Default: 50 Maximum number of collections to return |
| offset | integer (Offset) >= 0 Default: 0 Offset for pagination |
| name | string (Name) Name to search for |
| category | string (Category) Category to search for |
| tags | string (Tags) Tags to search for |
| scope | string (Scope of collections) Enum: "system" "tenant" Set to |
{- "first": {
- "href": "string"
}, - "next": {
- "href": "string"
}, - "limit": 0,
- "total_count": 0,
- "items": [
- {
- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
]
}
Create a new collection.
| name required | string Collection name. |
| category required | string Collection category. |
| description | string Optional description. |
| tags | Array of strings Tags. |
| custom | object Custom key-value data. |
| pass_criteria | object (PassCriteria) Pass criteria for the collection. |
| benchmarks required | Array of objects (CollectionBenchmarkConfig) Benchmarks in the collection. |
{- "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
Get details of a specific collection.
| id required | string (Collection Id) |
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
Update an existing collection.
| id required | string (Collection Id) |
| name required | string Collection name. |
| category required | string Collection category. |
| description | string Optional description. |
| tags | Array of strings Tags. |
| custom | object Custom key-value data. |
| pass_criteria | object (PassCriteria) Pass criteria for the collection. |
| benchmarks required | Array of objects (CollectionBenchmarkConfig) Benchmarks in the collection. |
{- "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
Partially update an existing collection.
| id required | string (Collection Id) |
| op required | string (PatchOp) Enum: "replace" "add" "remove" Patch operation type |
| path required | string JSON Pointer path |
| value | any Value for add/replace (omit for remove) |
[- {
- "op": "replace",
- "path": "string",
- "value": null
}
]
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "category": "string",
- "description": "string",
- "tags": [
- "string"
], - "custom": { },
- "pass_criteria": {
- "threshold": 0
}, - "benchmarks": [
- {
- "id": "string",
- "provider_id": "string",
- "url": "string",
- "weight": 1,
- "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}, - "parameters": { },
- "test_data_ref": {
- "s3": {
- "bucket": "my-eval-bucket",
- "key": "datasets/benchmark-a/v1",
- "secret_ref": "my-s3-connection-secret"
}
}
}
]
}
List all registered evaluation providers.
| limit | integer (Limit) [ 1 .. 100 ] Default: 50 Maximum number of providers to return |
| offset | integer (Offset) >= 0 Default: 0 Offset for pagination |
| benchmarks | boolean (Benchmarks) Default: true Include or exclude benchmarks supported by this provider in the response |
| name | string (Name) Name to search for |
| tags | string (Tags) Tags to search for |
| scope | string (Scope of providers) Enum: "system" "tenant" Set to |
{- "first": {
- "href": "string"
}, - "next": {
- "href": "string"
}, - "limit": 0,
- "total_count": 0,
- "items": [
- {
- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}
], - "errors": [
- "string"
]
}
Create a new provider scoped to the current tenant (Bring Your Own Provider).
| name required | string Provider name |
| title | string Provider display title |
| description | string Provider description |
| tags | Array of strings Provider tags |
| runtime required | object (Runtime) Provider runtime configuration |
| benchmarks required | Array of objects (BenchmarkResource) Benchmarks offered by this provider |
{- "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}
Get a provider by ID.
| id required | string (Provider Id) Provider ID |
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}
Update an existing provider.
| id required | string (Provider Id) Provider ID |
| name required | string Provider name |
| title | string Provider display title |
| description | string Provider description |
| tags | Array of strings Provider tags |
| runtime required | object (Runtime) Provider runtime configuration |
| benchmarks required | Array of objects (BenchmarkResource) Benchmarks offered by this provider |
{- "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}
Partially update an existing provider.
| id required | string (Provider Id) |
| op required | string (PatchOp) Enum: "replace" "add" "remove" Patch operation type |
| path required | string JSON Pointer path |
| value | any Value for add/replace (omit for remove) |
[- {
- "op": "replace",
- "path": "string",
- "value": null
}
]
{- "resource": {
- "id": "string",
- "tenant": "string",
- "created_at": "2019-08-24T14:15:22Z",
- "updated_at": "2019-08-24T14:15:22Z",
- "owner": "string"
}, - "name": "string",
- "title": "string",
- "description": "string",
- "tags": [
- "string"
], - "runtime": {
- "k8s": {
- "image": "string",
- "entrypoint": [
- "string"
], - "cpu_request": "string",
- "memory_request": "string",
- "cpu_limit": "string",
- "memory_limit": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}, - "local": {
- "command": "string",
- "env": [
- {
- "name": "string",
- "value": "string"
}
]
}
}, - "benchmarks": [
- {
- "id": "string",
- "url": "string",
- "name": "string",
- "description": "string",
- "category": "string",
- "metrics": [
- "string"
], - "num_few_shot": 0,
- "dataset_size": 0,
- "tags": [
- "string"
], - "primary_score": {
- "metric": "string",
- "lower_is_better": false
}, - "pass_criteria": {
- "threshold": 0
}
}
]
}