POST /api/v1/evals/pairwise

Create a pairwise comparison or submit a vote

Action-discriminated. action='create' inserts a head-to-head A-vs-B comparison; action='vote' records a winner (a|b|tie), updates ELO ratings, and completes the comparison. projectId is required for both.

Authentication

Send Authorization: Bearer YOUR_API_KEY on every request. Generate API keys at /dashboard/api-keys.

Request body (required)

Schema

{
  "application/json": {
    "schema": {
      "oneOf": [
        {
          "type": "object",
          "properties": {
            "action": {
              "type": "string",
              "enum": [
                "create"
              ]
            },
            "projectId": {
              "type": "string",
              "format": "uuid",
              "pattern": "^([0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[1-8][0-9a-fA-F]{3}-[89abAB][0-9a-fA-F]{3}-[0-9a-fA-F]{12}|00000000-0000-0000-0000-000000000000|ffffffff-ffff-ffff-ffff-ffffffffffff)$"
            },
            "inputText": {
              "type": "string",
              "minLength": 1,
              "maxLength": 100000
            },
            "responseA": {
              "type": "string",
              "minLength": 1,
              "maxLength": 100000
            },
            "responseB": {
              "type": "string",
              "minLength": 1,
              "maxLength": 100000
            },
            "modelA": {
              "type": "string",
              "maxLength": 120
            },
            "modelB": {
              "type": "string",
              "maxLength": 120
            },
            "metadata": {
              "type": "object",
              "additionalProperties": {}
            }
          },
          "required": [
            "action",
            "projectId",
            "inputText",
            "responseA",
            "responseB"
          ],
          "additionalProperties": false
        },
        {
          "type": "object",
          "properties": {
            "action": {
              "type": "string",
              "enum": [
                "vote"
              ]
            },
            "projectId": {
              "type": "string",
              "format": "uuid",
              "pattern": "^([0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[1-8][0-9a-fA-F]{3}-[89abAB][0-9a-fA-F]{3}-[0-9a-fA-F]{12}|00000000-0000-0000-0000-000000000000|ffffffff-ffff-ffff-ffff-ffffffffffff)$"
            },
            "comparisonId": {
              "type": "string",
              "format": "uuid",
              "pattern": "^([0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[1-8][0-9a-fA-F]{3}-[89abAB][0-9a-fA-F]{3}-[0-9a-fA-F]{12}|00000000-0000-0000-0000-000000000000|ffffffff-ffff-ffff-ffff-ffffffffffff)$"
            },
            "winner": {
              "type": "string",
              "enum": [
                "a",
                "b",
                "tie"
              ]
            },
            "feedback": {
              "type": "string",
              "maxLength": 20000
            }
          },
          "required": [
            "action",
            "projectId",
            "comparisonId",
            "winner"
          ],
          "additionalProperties": false
        }
      ]
    }
  }
}

Response

200 example

{
  "success": true
}

All status codes

200 — Vote recorded; ELO updated.

201 — Comparison created.

400 — (no description)

401 — (no description)

404 — (no description)

429 — (no description)

Code samples

cURL

# Create a pairwise comparison (action="create").
# The request body is required: action, projectId, inputText, responseA and
# responseB must all be present for a "create" request.
# Replace the placeholder projectId with your own project's UUID.
curl -X POST \
  https://evalguard.ai/api/v1/evals/pairwise \
  -H "Authorization: Bearer $EVALGUARD_API_KEY" \
  -H "Content-Type: application/json" \
  -d '{
    "action": "create",
    "projectId": "123e4567-e89b-42d3-a456-426614174000",
    "inputText": "What is the capital of France?",
    "responseA": "Paris.",
    "responseB": "The capital of France is Paris."
  }'

TypeScript

import { EvalGuard } from "@evalguard/sdk";

// Construct the SDK client with the API key taken from the EVALGUARD_API_KEY
// environment variable.
const client = new EvalGuard({ apiKey: process.env.EVALGUARD_API_KEY });

// Issue a POST to the pairwise endpoint and log whatever the SDK returns.
// NOTE(review): this endpoint's request body is required (action, projectId, and
// the create/vote fields from the schema), but no body is passed here.
// TODO: confirm how client.request accepts a JSON body and add one to this sample.
const response = await client.request({
  method: "POST",
  path: "/api/v1/evals/pairwise",
});
console.log(response);

Python

from evalguard import EvalGuard
import os

# Construct the SDK client with the API key taken from the EVALGUARD_API_KEY
# environment variable (raises KeyError if the variable is not set).
client = EvalGuard(api_key=os.environ["EVALGUARD_API_KEY"])

# Issue a POST to the pairwise endpoint and print whatever the SDK returns.
# NOTE(review): this endpoint's request body is required (action, projectId, and
# the create/vote fields from the schema), but no body is passed here.
# TODO: confirm how client.request accepts a JSON body and add one to this sample.
response = client.request(method="POST", path="/api/v1/evals/pairwise")
print(response)

package main

import (
	"context"
	"fmt"
	"net/http"
	"os"
	"strings"
)

// main sends a sample action="create" request to the pairwise endpoint and
// prints the HTTP status line of the response.
//
// The API key is read from the EVALGUARD_API_KEY environment variable.
// Replace the placeholder projectId with your own project's UUID.
func main() {
	// The endpoint requires a JSON body; for action="create" the fields
	// action, projectId, inputText, responseA and responseB are mandatory.
	payload := strings.NewReader(`{
  "action": "create",
  "projectId": "123e4567-e89b-42d3-a456-426614174000",
  "inputText": "What is the capital of France?",
  "responseA": "Paris.",
  "responseB": "The capital of France is Paris."
}`)

	req, err := http.NewRequestWithContext(context.Background(), "POST", "https://evalguard.ai/api/v1/evals/pairwise", payload)
	if err != nil {
		panic(err)
	}
	req.Header.Set("Authorization", "Bearer "+os.Getenv("EVALGUARD_API_KEY"))
	// Declare the body's media type so the server parses it as JSON.
	req.Header.Set("Content-Type", "application/json")

	resp, err := http.DefaultClient.Do(req)
	if err != nil {
		panic(err)
	}
	defer resp.Body.Close()
	fmt.Println(resp.Status)
}

Errors

400 · 401 · 404 · 429

Request body required

Response

Code samples

Errors

Other Evals endpoints