Create Session Eval Run

# Create a session eval run: POST a JSON body listing the session metrics to
# evaluate, authenticating with a bearer token in the Authorization header.
# Replace <token> with your auth token before running.
curl --request POST \
  --url https://api.pandaprobe.com/evaluations/session-runs \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --data '
{
  "metrics": [
    "agent_reliability",
    "agent_consistency"
  ]
}
'

import requests

# Endpoint that creates a session eval run.
url = "https://api.pandaprobe.com/evaluations/session-runs"

# "metrics" is the only required body field and must contain at least one
# session metric name.
payload = { "metrics": ["agent_reliability", "agent_consistency"] }
headers = {
    "Authorization": "Bearer <token>",  # replace <token> with your auth token
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so without one this call could block
# forever if the server never answers. 30 seconds is an arbitrary upper bound.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body (the created run, or a validation error).
print(response.text)

// Request settings: a POST with bearer authentication and a JSON body naming
// the session metrics to evaluate.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json'
  },
  body: JSON.stringify({metrics: ['agent_reliability', 'agent_consistency']})
};

// Send the request, parse the JSON response and log it; any failure along the
// way (network error, invalid JSON) is logged to the error console instead.
(async () => {
  try {
    const response = await fetch('https://api.pandaprobe.com/evaluations/session-runs', options);
    const data = await response.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a POST request to the session eval run endpoint with a JSON body
// naming the metrics to run, then prints the raw response body to stdout.
//
// A failure while building the request, sending it, or reading the response
// is printed and the program stops, rather than being silently discarded.
func main() {
	url := "https://api.pandaprobe.com/evaluations/session-runs"

	payload := strings.NewReader("{\n  \"metrics\": [\n    \"agent_reliability\",\n    \"agent_consistency\"\n  ]\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("creating request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so closing its body would panic.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

{
  "id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
  "name": "<string>",
  "status": "PENDING",
  "metric_names": [
    "<string>"
  ],
  "total_traces": 123,
  "evaluated_count": 123,
  "failed_count": 123,
  "created_at": "<string>",
  "completed_at": "<string>",
  "project_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
  "target_type": "<string>",
  "filters": {},
  "sampling_rate": 123,
  "model": "<string>",
  "monitor_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
  "error_message": "<string>"
}

{
  "detail": [
    {
      "loc": [
        "<string>"
      ],
      "msg": "<string>",
      "type": "<string>",
      "input": "<unknown>",
      "ctx": {}
    }
  ]
}

POST /evaluations/session-runs

Create Session Eval Run

# Create a session eval run: POST a JSON body listing the session metrics to
# evaluate, authenticating with a bearer token in the Authorization header.
# Replace <token> with your auth token before running.
curl --request POST \
  --url https://api.pandaprobe.com/evaluations/session-runs \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --data '
{
  "metrics": [
    "agent_reliability",
    "agent_consistency"
  ]
}
'

import requests

# Endpoint that creates a session eval run.
url = "https://api.pandaprobe.com/evaluations/session-runs"

# "metrics" is the only required body field and must contain at least one
# session metric name.
payload = { "metrics": ["agent_reliability", "agent_consistency"] }
headers = {
    "Authorization": "Bearer <token>",  # replace <token> with your auth token
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so without one this call could block
# forever if the server never answers. 30 seconds is an arbitrary upper bound.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw response body (the created run, or a validation error).
print(response.text)

// Request settings: a POST with bearer authentication and a JSON body naming
// the session metrics to evaluate.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json'
  },
  body: JSON.stringify({metrics: ['agent_reliability', 'agent_consistency']})
};

// Send the request, parse the JSON response and log it; any failure along the
// way (network error, invalid JSON) is logged to the error console instead.
(async () => {
  try {
    const response = await fetch('https://api.pandaprobe.com/evaluations/session-runs', options);
    const data = await response.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a POST request to the session eval run endpoint with a JSON body
// naming the metrics to run, then prints the raw response body to stdout.
//
// A failure while building the request, sending it, or reading the response
// is printed and the program stops, rather than being silently discarded.
func main() {
	url := "https://api.pandaprobe.com/evaluations/session-runs"

	payload := strings.NewReader("{\n  \"metrics\": [\n    \"agent_reliability\",\n    \"agent_consistency\"\n  ]\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("creating request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so closing its body would panic.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	fmt.Println(string(body))
}

{
  "id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
  "name": "<string>",
  "status": "PENDING",
  "metric_names": [
    "<string>"
  ],
  "total_traces": 123,
  "evaluated_count": 123,
  "failed_count": 123,
  "created_at": "<string>",
  "completed_at": "<string>",
  "project_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
  "target_type": "<string>",
  "filters": {},
  "sampling_rate": 123,
  "model": "<string>",
  "monitor_id": "3c90c3cc-0d44-4b50-8888-8dd25736052a",
  "error_message": "<string>"
}

{
  "detail": [
    {
      "loc": [
        "<string>"
      ],
      "msg": "<string>",
      "type": "<string>",
      "input": "<unknown>",
      "ctx": {}
    }
  ]
}

Authorizations

Authorization

string

header

required

Bearer authentication header of the form Bearer <token>, where <token> is your auth token.

Body

application/json

Create a filter-based session eval run.

metrics

string[]

required

Session metric names (e.g. ['agent_reliability']).

Minimum array length: 1

name

string | null

Human-readable label.

filters

SessionEvalRunFilters · object

Filters for session-level evaluation runs.

Show child attributes

sampling_rate

number

default:1

Fraction of sessions to evaluate.

Required range: 0 <= x <= 1

model

string | null

LLM model override for judge calls.

signal_weights

Signal Weights · object | null

Override default signal weights.

Show child attributes

Response

Successful Response

Full eval run representation used by both list and detail endpoints.

id

string<uuid>

required

name

string | null

required

status

enum<string>

required

Lifecycle status of an evaluation job.

Available options:

PENDING,

RUNNING,

COMPLETED,

FAILED

metric_names

string[]

required

total_traces

integer

required

evaluated_count

integer

required

failed_count

integer

required

created_at

string

required

completed_at

string | null

required

project_id

string<uuid>

required

target_type

string

required

filters

Filters · object

required

sampling_rate

number

required

model

string | null

required

monitor_id

string<uuid> | null

required

error_message

string | null

required

Get Available Session Metrics | List Session Eval Runs