Submit evaluation result

# Submit the evaluation result for one prompt.
# Substitute real values for {agentId}, {promptId}, and <api-key> before running.
curl -X POST \
  -H 'Content-Type: application/json' \
  -H 'x-api-key: <api-key>' \
  -d '
{
  "status": "passed",
  "response": "Customers can request a refund within 30 days of purchase.",
  "expectedAnswer": "Customers can request a refund within 30 days.",
  "hallucinationLabel": "FactIsPresent",
  "hallucinationFindings": []
}
' \
  https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}

import requests

# Submit the evaluation result for one prompt of an evaluation agent.
# Substitute real values for {agentId} and {promptId} in the URL, and for <api-key> below.
url = "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}"

# JSON body: the evaluation outcome plus the agent response that was evaluated.
payload = {
    "status": "passed",
    "response": "Customers can request a refund within 30 days of purchase.",
    "expectedAnswer": "Customers can request a refund within 30 days.",
    "hallucinationLabel": "FactIsPresent",
    "hallucinationFindings": []
}
headers = {
    "x-api-key": "<api-key>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default; bound the wait (in seconds) so a
# stalled server cannot hang the script indefinitely.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body returned by the server.
print(response.text)

// Evaluation outcome to submit for the prompt.
const result = {
  status: 'passed',
  response: 'Customers can request a refund within 30 days of purchase.',
  expectedAnswer: 'Customers can request a refund within 30 days.',
  hallucinationLabel: 'FactIsPresent',
  hallucinationFindings: []
};

// Request settings: POST with the API-key header and a JSON-encoded body.
// Substitute real values for {agentId}, {promptId}, and <api-key>.
const options = {
  method: 'POST',
  headers: {'x-api-key': '<api-key>', 'Content-Type': 'application/json'},
  body: JSON.stringify(result)
};

// Send the request and log the parsed JSON reply; any failure is logged with console.error.
(async () => {
  try {
    const reply = await fetch('https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}', options);
    const parsed = await reply.json();
    console.log(parsed);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Submit the evaluation result for one prompt using the cURL extension.
// Substitute real values for {agentId}, {promptId}, and <api-key>.
$endpoint = "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}";

// JSON request body.
$payload = json_encode([
  'status' => 'passed',
  'response' => 'Customers can request a refund within 30 days of purchase.',
  'expectedAnswer' => 'Customers can request a refund within 30 days.',
  'hallucinationLabel' => 'FactIsPresent',
  'hallucinationFindings' => [],
]);

$headers = [
  "Content-Type: application/json",
  "x-api-key: <api-key>",
];

$curl = curl_init();

// Configure the transfer one option at a time.
curl_setopt($curl, CURLOPT_URL, $endpoint);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
curl_setopt($curl, CURLOPT_ENCODING, "");
curl_setopt($curl, CURLOPT_MAXREDIRS, 10);
curl_setopt($curl, CURLOPT_TIMEOUT, 30);
curl_setopt($curl, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_1_1);
curl_setopt($curl, CURLOPT_CUSTOMREQUEST, "POST");
curl_setopt($curl, CURLOPT_POSTFIELDS, $payload);
curl_setopt($curl, CURLOPT_HTTPHEADER, $headers);

// Read the error text before the handle is closed.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error when there is one, otherwise the response body.
echo $err ? ("cURL Error #:" . $err) : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main submits one evaluation result to the test-results endpoint and prints
// the response body. Each step's error is reported and stops the program,
// instead of being discarded.
//
// Substitute real values for {agentId}, {promptId}, and <api-key>.
func main() {
	url := "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}"

	payload := strings.NewReader("{\n  \"status\": \"passed\",\n  \"response\": \"Customers can request a refund within 30 days of purchase.\",\n  \"expectedAnswer\": \"Customers can request a refund within 30 days.\",\n  \"hallucinationLabel\": \"FactIsPresent\",\n  \"hallucinationFindings\": []\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("x-api-key", "<api-key>")
	req.Header.Add("Content-Type", "application/json")

	// NOTE: http.DefaultClient has no timeout; production code should use a
	// client with Timeout set.
	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res can be nil when Do fails, so it must not be dereferenced here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// Submit the evaluation result for one prompt with the Unirest client.
// Substitute real values for {agentId}, {promptId}, and <api-key>.
String endpoint = "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}";
String requestJson = "{\n  \"status\": \"passed\",\n  \"response\": \"Customers can request a refund within 30 days of purchase.\",\n  \"expectedAnswer\": \"Customers can request a refund within 30 days.\",\n  \"hallucinationLabel\": \"FactIsPresent\",\n  \"hallucinationFindings\": []\n}";

HttpResponse<String> response = Unirest.post(endpoint)
  .header("x-api-key", "<api-key>")
  .header("Content-Type", "application/json")
  .body(requestJson)
  .asString();

require 'uri'
require 'net/http'

# Submit the evaluation result for one prompt over HTTPS with Net::HTTP.
# Substitute real values for {agentId}, {promptId}, and <api-key>.
endpoint = URI("https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}")

client = Net::HTTP.new(endpoint.host, endpoint.port).tap { |h| h.use_ssl = true }

# Headers are applied in the listed order.
header_fields = {
  "x-api-key" => '<api-key>',
  "Content-Type" => 'application/json'
}

post = Net::HTTP::Post.new(endpoint)
header_fields.each { |name, value| post[name] = value }
post.body = "{\n  \"status\": \"passed\",\n  \"response\": \"Customers can request a refund within 30 days of purchase.\",\n  \"expectedAnswer\": \"Customers can request a refund within 30 days.\",\n  \"hallucinationLabel\": \"FactIsPresent\",\n  \"hallucinationFindings\": []\n}"

# Send the request and print the response body.
puts client.request(post).read_body

{
  "id": "4a2dc063-36f8-47b0-a703-bb2d7d4e44f5",
  "agentId": "2f7e9c9c-9a2e-4e3a-b77f-6d9d1a7e3a11",
  "promptId": 42,
  "status": "passed",
  "sessionId": null,
  "response": "Customers can request a refund within 30 days of purchase.",
  "expectedAnswer": "Customers can request a refund within 30 days.",
  "hallucinationLabel": "FactIsPresent",
  "hallucinationFindings": [],
  "created_at": "2026-06-02T15:20:00Z",
  "updated_at": "2026-06-02T15:21:00Z"
}

POST /api/agents/{agentId}/test-results/{promptId}

Submit evaluation result

# Submit the evaluation result for one prompt.
# Substitute real values for {agentId}, {promptId}, and <api-key> before running.
curl -X POST \
  -H 'Content-Type: application/json' \
  -H 'x-api-key: <api-key>' \
  -d '
{
  "status": "passed",
  "response": "Customers can request a refund within 30 days of purchase.",
  "expectedAnswer": "Customers can request a refund within 30 days.",
  "hallucinationLabel": "FactIsPresent",
  "hallucinationFindings": []
}
' \
  https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}

import requests

# Submit the evaluation result for one prompt of an evaluation agent.
# Substitute real values for {agentId} and {promptId} in the URL, and for <api-key> below.
url = "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}"

# JSON body: the evaluation outcome plus the agent response that was evaluated.
payload = {
    "status": "passed",
    "response": "Customers can request a refund within 30 days of purchase.",
    "expectedAnswer": "Customers can request a refund within 30 days.",
    "hallucinationLabel": "FactIsPresent",
    "hallucinationFindings": []
}
headers = {
    "x-api-key": "<api-key>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default; bound the wait (in seconds) so a
# stalled server cannot hang the script indefinitely.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body returned by the server.
print(response.text)

// Evaluation outcome to submit for the prompt.
const result = {
  status: 'passed',
  response: 'Customers can request a refund within 30 days of purchase.',
  expectedAnswer: 'Customers can request a refund within 30 days.',
  hallucinationLabel: 'FactIsPresent',
  hallucinationFindings: []
};

// Request settings: POST with the API-key header and a JSON-encoded body.
// Substitute real values for {agentId}, {promptId}, and <api-key>.
const options = {
  method: 'POST',
  headers: {'x-api-key': '<api-key>', 'Content-Type': 'application/json'},
  body: JSON.stringify(result)
};

// Send the request and log the parsed JSON reply; any failure is logged with console.error.
(async () => {
  try {
    const reply = await fetch('https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}', options);
    const parsed = await reply.json();
    console.log(parsed);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Submit the evaluation result for one prompt using the cURL extension.
// Substitute real values for {agentId}, {promptId}, and <api-key>.
$endpoint = "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}";

// JSON request body.
$payload = json_encode([
  'status' => 'passed',
  'response' => 'Customers can request a refund within 30 days of purchase.',
  'expectedAnswer' => 'Customers can request a refund within 30 days.',
  'hallucinationLabel' => 'FactIsPresent',
  'hallucinationFindings' => [],
]);

$headers = [
  "Content-Type: application/json",
  "x-api-key: <api-key>",
];

$curl = curl_init();

// Configure the transfer one option at a time.
curl_setopt($curl, CURLOPT_URL, $endpoint);
curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
curl_setopt($curl, CURLOPT_ENCODING, "");
curl_setopt($curl, CURLOPT_MAXREDIRS, 10);
curl_setopt($curl, CURLOPT_TIMEOUT, 30);
curl_setopt($curl, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_1_1);
curl_setopt($curl, CURLOPT_CUSTOMREQUEST, "POST");
curl_setopt($curl, CURLOPT_POSTFIELDS, $payload);
curl_setopt($curl, CURLOPT_HTTPHEADER, $headers);

// Read the error text before the handle is closed.
$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error when there is one, otherwise the response body.
echo $err ? ("cURL Error #:" . $err) : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main submits one evaluation result to the test-results endpoint and prints
// the response body. Each step's error is reported and stops the program,
// instead of being discarded.
//
// Substitute real values for {agentId}, {promptId}, and <api-key>.
func main() {
	url := "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}"

	payload := strings.NewReader("{\n  \"status\": \"passed\",\n  \"response\": \"Customers can request a refund within 30 days of purchase.\",\n  \"expectedAnswer\": \"Customers can request a refund within 30 days.\",\n  \"hallucinationLabel\": \"FactIsPresent\",\n  \"hallucinationFindings\": []\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("x-api-key", "<api-key>")
	req.Header.Add("Content-Type", "application/json")

	// NOTE: http.DefaultClient has no timeout; production code should use a
	// client with Timeout set.
	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res can be nil when Do fails, so it must not be dereferenced here.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

// Submit the evaluation result for one prompt with the Unirest client.
// Substitute real values for {agentId}, {promptId}, and <api-key>.
String endpoint = "https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}";
String requestJson = "{\n  \"status\": \"passed\",\n  \"response\": \"Customers can request a refund within 30 days of purchase.\",\n  \"expectedAnswer\": \"Customers can request a refund within 30 days.\",\n  \"hallucinationLabel\": \"FactIsPresent\",\n  \"hallucinationFindings\": []\n}";

HttpResponse<String> response = Unirest.post(endpoint)
  .header("x-api-key", "<api-key>")
  .header("Content-Type", "application/json")
  .body(requestJson)
  .asString();

require 'uri'
require 'net/http'

# Submit the evaluation result for one prompt over HTTPS with Net::HTTP.
# Substitute real values for {agentId}, {promptId}, and <api-key>.
endpoint = URI("https://agent-evalserver-production.up.railway.app/api/agents/{agentId}/test-results/{promptId}")

client = Net::HTTP.new(endpoint.host, endpoint.port).tap { |h| h.use_ssl = true }

# Headers are applied in the listed order.
header_fields = {
  "x-api-key" => '<api-key>',
  "Content-Type" => 'application/json'
}

post = Net::HTTP::Post.new(endpoint)
header_fields.each { |name, value| post[name] = value }
post.body = "{\n  \"status\": \"passed\",\n  \"response\": \"Customers can request a refund within 30 days of purchase.\",\n  \"expectedAnswer\": \"Customers can request a refund within 30 days.\",\n  \"hallucinationLabel\": \"FactIsPresent\",\n  \"hallucinationFindings\": []\n}"

# Send the request and print the response body.
puts client.request(post).read_body

{
  "id": "4a2dc063-36f8-47b0-a703-bb2d7d4e44f5",
  "agentId": "2f7e9c9c-9a2e-4e3a-b77f-6d9d1a7e3a11",
  "promptId": 42,
  "status": "passed",
  "sessionId": null,
  "response": "Customers can request a refund within 30 days of purchase.",
  "expectedAnswer": "Customers can request a refund within 30 days.",
  "hallucinationLabel": "FactIsPresent",
  "hallucinationFindings": [],
  "created_at": "2026-06-02T15:20:00Z",
  "updated_at": "2026-06-02T15:21:00Z"
}

Authorizations

x-api-key

string

header

required

Platform API key for authenticated account-level API access

Path Parameters

agentId

string<uuid>

required

Evaluation agent ID.

promptId

integer

required

Question ID returned by the "Add evaluation questions" endpoint.

Body

application/json

Submit the agent response and evaluation outcome for a prompt.

status

enum<string>

required

Evaluation outcome.

Available options: passed, failed, ambiguous

Example:

"passed"

response

string

required

Agent response to the prompt.

Example:

"Customers can request a refund within 30 days of purchase."

expectedAnswer

string | null

Reference answer used for evaluation.

Example:

"Customers can request a refund within 30 days."

hallucinationLabel

string | null

Optional hallucination label returned by your evaluation step.

Example:

"FactIsPresent"

hallucinationFindings

object[] | null

Optional fact-level findings returned by your evaluation step.

Example:

[]

Response

200 - application/json

Test result stored

Stored evaluation result for one prompt.

id

string<uuid>

Unique result identifier.

Example:

"4a2dc063-36f8-47b0-a703-bb2d7d4e44f5"

agentId

string<uuid>

Evaluation agent ID.

Example:

"2f7e9c9c-9a2e-4e3a-b77f-6d9d1a7e3a11"

promptId

integer

Prompt ID this result belongs to.

Example:

42

status

enum<string>

Evaluation outcome.

Available options: passed, failed, ambiguous

Example:

"passed"

sessionId

string<uuid> | null

Optional session identifier associated with the result.

Example:

"a75b1bb5-0c7c-4302-978e-e2452b79df26"

response

string | null

Agent response that was evaluated.

Example:

"Customers can request a refund within 30 days of purchase."

expectedAnswer

string | null

Reference answer used for evaluation.

Example:

"Customers can request a refund within 30 days."

hallucinationLabel

string | null

Hallucination label returned by the evaluator, when available.

Example:

"FactIsPresent"

hallucinationFindings

object[] | null

Fact-level findings returned by the evaluator.

Example:

[]

created_at

string<date-time>

Creation timestamp.

Example:

"2026-06-02T15:20:00Z"

updated_at

string<date-time>

Last update timestamp.

Example:

"2026-06-02T15:21:00Z"

Delete evaluation question | View evaluation results

Overview

Evaluation API

Submit evaluation result

Authorizations

Path Parameters

Body

Response