Batch Evaluate

POST

api

batch

evaluate

cURL

# Submit one batch of items to the evaluate endpoint.
# <token> and every "<string>" value are placeholders to replace before running.
curl --request POST \
  --url https://labs.tacitintelligence.co/api/v1/batch/evaluate \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --data '
{
  "items": [
    {
      "id": "<string>",
      "collection_slug": "<string>",
      "scenario_slug": "<string>",
      "messages": [
        {
          "content": "<string>",
          "tool_calls": [
            {
              "name": "<string>",
              "input": {}
            }
          ]
        }
      ],
      "normalization_key": "<string>",
      "normalization_windows": [
        "<string>"
      ]
    }
  ]
}
'

import requests

# Endpoint that receives a batch of evaluation items in one request.
url = "https://labs.tacitintelligence.co/api/v1/batch/evaluate"

# Request body. Every "<string>" value is a placeholder to replace.
payload = { "items": [
        {
            "id": "<string>",
            "collection_slug": "<string>",
            "scenario_slug": "<string>",
            "messages": [
                {
                    "content": "<string>",
                    "tool_calls": [
                        {
                            "name": "<string>",
                            "input": {}
                        }
                    ]
                }
            ],
            "normalization_key": "<string>",
            "normalization_windows": ["<string>"]
        }
    ] }
# "<token>" is a placeholder for the API key.
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests never times out by default, so an unresponsive server would block
# this script forever; give up after 30 seconds instead.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body (success and error replies are both JSON).
print(response.text)

// Request body: a batch holding one item. Every '<string>' is a placeholder.
const requestBody = {
  items: [
    {
      id: '<string>',
      collection_slug: '<string>',
      scenario_slug: '<string>',
      messages: [
        {
          content: '<string>',
          tool_calls: [{name: '<string>', input: {}}]
        }
      ],
      normalization_key: '<string>',
      normalization_windows: ['<string>']
    }
  ]
};

// '<token>' is a placeholder for the API key.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json'
  },
  body: JSON.stringify(requestBody)
};

// Send the batch, parse the JSON reply and log it; any failure is logged as an error.
fetch('https://labs.tacitintelligence.co/api/v1/batch/evaluate', options)
  .then(response => response.json())
  .then(data => console.log(data))
  .catch(error => console.error(error));

<?php

// Send one batch of items to the evaluate endpoint and print the raw reply.
// '<token>' and every '<string>' value are placeholders to replace.
$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://labs.tacitintelligence.co/api/v1/batch/evaluate",
  // Make curl_exec() return the response body instead of printing it.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  // Give up after 30 seconds.
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'items' => [
      [
        'id' => '<string>',
        'collection_slug' => '<string>',
        'scenario_slug' => '<string>',
        'messages' => [
          [
            'content' => '<string>',
            'tool_calls' => [
              [
                'name' => '<string>',
                // An empty PHP array is encoded as [] by json_encode();
                // stdClass produces the JSON object {} that the other
                // request samples send for "input".
                'input' => new stdClass()
              ]
            ]
          ]
        ],
        'normalization_key' => '<string>',
        'normalization_windows' => [
          '<string>'
        ]
      ]
    ]
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer <token>",
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
// Read the transport error (empty string when there was none) before closing the handle.
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main posts a sample batch to the evaluate endpoint and prints the raw
// response body. A failure while building, sending or reading the request is
// printed and the program stops, rather than continuing with a nil response.
func main() {
	url := "https://labs.tacitintelligence.co/api/v1/batch/evaluate"

	// JSON request body; every "<string>" value is a placeholder.
	payload := strings.NewReader("{\n  \"items\": [\n    {\n      \"id\": \"<string>\",\n      \"collection_slug\": \"<string>\",\n      \"scenario_slug\": \"<string>\",\n      \"messages\": [\n        {\n          \"content\": \"<string>\",\n          \"tool_calls\": [\n            {\n              \"name\": \"<string>\",\n              \"input\": {}\n            }\n          ]\n        }\n      ],\n      \"normalization_key\": \"<string>\",\n      \"normalization_windows\": [\n        \"<string>\"\n      ]\n    }\n  ]\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	// "<token>" is a placeholder for the API key.
	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res may be nil when Do fails, so it must not be dereferenced here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// POST a sample batch to the evaluate endpoint and read the reply as a String.
// "<token>" and every "<string>" value in the JSON body are placeholders.
HttpResponse<String> response = Unirest.post("https://labs.tacitintelligence.co/api/v1/batch/evaluate")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"items\": [\n    {\n      \"id\": \"<string>\",\n      \"collection_slug\": \"<string>\",\n      \"scenario_slug\": \"<string>\",\n      \"messages\": [\n        {\n          \"content\": \"<string>\",\n          \"tool_calls\": [\n            {\n              \"name\": \"<string>\",\n              \"input\": {}\n            }\n          ]\n        }\n      ],\n      \"normalization_key\": \"<string>\",\n      \"normalization_windows\": [\n        \"<string>\"\n      ]\n    }\n  ]\n}")
  .asString();

require 'uri'
require 'net/http'

# Endpoint that receives a batch of evaluation items.
endpoint = URI("https://labs.tacitintelligence.co/api/v1/batch/evaluate")

# HTTPS connection to the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Build the POST; '<token>' and every "<string>" value are placeholders.
post = Net::HTTP::Post.new(endpoint)
post["Authorization"] = 'Bearer <token>'
post["Content-Type"] = 'application/json'
post.body = "{\n  \"items\": [\n    {\n      \"id\": \"<string>\",\n      \"collection_slug\": \"<string>\",\n      \"scenario_slug\": \"<string>\",\n      \"messages\": [\n        {\n          \"content\": \"<string>\",\n          \"tool_calls\": [\n            {\n              \"name\": \"<string>\",\n              \"input\": {}\n            }\n          ]\n        }\n      ],\n      \"normalization_key\": \"<string>\",\n      \"normalization_windows\": [\n        \"<string>\"\n      ]\n    }\n  ]\n}"

# Send the request and print the raw response body.
reply = client.request(post)
puts reply.read_body

{
  "results": [
    {
      "id": "<string>",
      "status": "<string>",
      "reward": 0.5,
      "scores": {},
      "score_breakdown": {},
      "normalized": {}
    }
  ],
  "scoring_version": "<string>",
  "total_time_ms": 123
}

{
  "error": "<string>",
  "details": {}
}

Authorizations

Authorization

string

header

required

API key obtained from the Labs Portal, sent in the Authorization header as `Bearer <token>`.

Body

application/json

items

object[]

required

Array of evaluation items (1-100 items per batch)

Required array length: 1 - 100 elements

Show child attributes

Response

Success

results

object[]

required

Results for each item in the batch

Each result is either a success (with reward and scores) or an error (with an error message). Check the status field to tell them apart: error items have no reward and must not be used for training.

Option 1
Option 2

Show child attributes

scoring_version

string

required

Version of the scoring algorithm used

total_time_ms

number

required

Total time to process the batch in milliseconds

Compare: Pairwise comparison for preference-based training (DPO). Compare two responses and determine which is better.

cURL

# Submit one batch of items to the evaluate endpoint.
# <token> and every "<string>" value are placeholders to replace before running.
curl --request POST \
  --url https://labs.tacitintelligence.co/api/v1/batch/evaluate \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --data '
{
  "items": [
    {
      "id": "<string>",
      "collection_slug": "<string>",
      "scenario_slug": "<string>",
      "messages": [
        {
          "content": "<string>",
          "tool_calls": [
            {
              "name": "<string>",
              "input": {}
            }
          ]
        }
      ],
      "normalization_key": "<string>",
      "normalization_windows": [
        "<string>"
      ]
    }
  ]
}
'

import requests

# Endpoint that receives a batch of evaluation items in one request.
url = "https://labs.tacitintelligence.co/api/v1/batch/evaluate"

# Request body. Every "<string>" value is a placeholder to replace.
payload = { "items": [
        {
            "id": "<string>",
            "collection_slug": "<string>",
            "scenario_slug": "<string>",
            "messages": [
                {
                    "content": "<string>",
                    "tool_calls": [
                        {
                            "name": "<string>",
                            "input": {}
                        }
                    ]
                }
            ],
            "normalization_key": "<string>",
            "normalization_windows": ["<string>"]
        }
    ] }
# "<token>" is a placeholder for the API key.
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests never times out by default, so an unresponsive server would block
# this script forever; give up after 30 seconds instead.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body (success and error replies are both JSON).
print(response.text)

// Request body: a batch holding one item. Every '<string>' is a placeholder.
const requestBody = {
  items: [
    {
      id: '<string>',
      collection_slug: '<string>',
      scenario_slug: '<string>',
      messages: [
        {
          content: '<string>',
          tool_calls: [{name: '<string>', input: {}}]
        }
      ],
      normalization_key: '<string>',
      normalization_windows: ['<string>']
    }
  ]
};

// '<token>' is a placeholder for the API key.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json'
  },
  body: JSON.stringify(requestBody)
};

// Send the batch, parse the JSON reply and log it; any failure is logged as an error.
fetch('https://labs.tacitintelligence.co/api/v1/batch/evaluate', options)
  .then(response => response.json())
  .then(data => console.log(data))
  .catch(error => console.error(error));

<?php

// Send one batch of items to the evaluate endpoint and print the raw reply.
// '<token>' and every '<string>' value are placeholders to replace.
$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://labs.tacitintelligence.co/api/v1/batch/evaluate",
  // Make curl_exec() return the response body instead of printing it.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  // Give up after 30 seconds.
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'items' => [
      [
        'id' => '<string>',
        'collection_slug' => '<string>',
        'scenario_slug' => '<string>',
        'messages' => [
          [
            'content' => '<string>',
            'tool_calls' => [
              [
                'name' => '<string>',
                // An empty PHP array is encoded as [] by json_encode();
                // stdClass produces the JSON object {} that the other
                // request samples send for "input".
                'input' => new stdClass()
              ]
            ]
          ]
        ],
        'normalization_key' => '<string>',
        'normalization_windows' => [
          '<string>'
        ]
      ]
    ]
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer <token>",
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
// Read the transport error (empty string when there was none) before closing the handle.
$err = curl_error($curl);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} else {
  echo $response;
}

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main posts a sample batch to the evaluate endpoint and prints the raw
// response body. A failure while building, sending or reading the request is
// printed and the program stops, rather than continuing with a nil response.
func main() {
	url := "https://labs.tacitintelligence.co/api/v1/batch/evaluate"

	// JSON request body; every "<string>" value is a placeholder.
	payload := strings.NewReader("{\n  \"items\": [\n    {\n      \"id\": \"<string>\",\n      \"collection_slug\": \"<string>\",\n      \"scenario_slug\": \"<string>\",\n      \"messages\": [\n        {\n          \"content\": \"<string>\",\n          \"tool_calls\": [\n            {\n              \"name\": \"<string>\",\n              \"input\": {}\n            }\n          ]\n        }\n      ],\n      \"normalization_key\": \"<string>\",\n      \"normalization_windows\": [\n        \"<string>\"\n      ]\n    }\n  ]\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	// "<token>" is a placeholder for the API key.
	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res may be nil when Do fails, so it must not be dereferenced here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// POST a sample batch to the evaluate endpoint and read the reply as a String.
// "<token>" and every "<string>" value in the JSON body are placeholders.
HttpResponse<String> response = Unirest.post("https://labs.tacitintelligence.co/api/v1/batch/evaluate")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"items\": [\n    {\n      \"id\": \"<string>\",\n      \"collection_slug\": \"<string>\",\n      \"scenario_slug\": \"<string>\",\n      \"messages\": [\n        {\n          \"content\": \"<string>\",\n          \"tool_calls\": [\n            {\n              \"name\": \"<string>\",\n              \"input\": {}\n            }\n          ]\n        }\n      ],\n      \"normalization_key\": \"<string>\",\n      \"normalization_windows\": [\n        \"<string>\"\n      ]\n    }\n  ]\n}")
  .asString();

require 'uri'
require 'net/http'

# Endpoint that receives a batch of evaluation items.
endpoint = URI("https://labs.tacitintelligence.co/api/v1/batch/evaluate")

# HTTPS connection to the endpoint's host and port.
client = Net::HTTP.new(endpoint.host, endpoint.port)
client.use_ssl = true

# Build the POST; '<token>' and every "<string>" value are placeholders.
post = Net::HTTP::Post.new(endpoint)
post["Authorization"] = 'Bearer <token>'
post["Content-Type"] = 'application/json'
post.body = "{\n  \"items\": [\n    {\n      \"id\": \"<string>\",\n      \"collection_slug\": \"<string>\",\n      \"scenario_slug\": \"<string>\",\n      \"messages\": [\n        {\n          \"content\": \"<string>\",\n          \"tool_calls\": [\n            {\n              \"name\": \"<string>\",\n              \"input\": {}\n            }\n          ]\n        }\n      ],\n      \"normalization_key\": \"<string>\",\n      \"normalization_windows\": [\n        \"<string>\"\n      ]\n    }\n  ]\n}"

# Send the request and print the raw response body.
reply = client.request(post)
puts reply.read_body

{
  "results": [
    {
      "id": "<string>",
      "status": "<string>",
      "reward": 0.5,
      "scores": {},
      "score_breakdown": {},
      "normalized": {}
    }
  ],
  "scoring_version": "<string>",
  "total_time_ms": 123
}

{
  "error": "<string>",
  "details": {}
}

Overview

Catalog

Episodes

Evaluation

Key

Training Datasets

Authorizations

Body

Response