Interface EvalRun

A complete evaluation run.

/**
 * A complete evaluation run.
 */
interface EvalRun {
    /** Run ID. */
    runId: string;

    /** Run name/description. */
    name: string;

    /** Agent or persona being evaluated. */
    agentId?: string;

    /**
     * NOTE(review): not described separately in the reference; presumably the
     * persona counterpart of `agentId` — confirm.
     */
    personaId?: string;

    /** Model being used. */
    modelId?: string;

    /**
     * Timestamp at which the run started.
     * NOTE(review): the string format is not specified here (presumably
     * ISO 8601) — confirm.
     */
    startedAt: string;

    /** Timestamp at which the run completed; same string format as `startedAt`. */
    completedAt?: string;

    /** Status of the run. */
    status:
        | "completed"
        | "failed"
        | "pending"
        | "running";

    /** Individual test results. */
    results: EvalTestResult[];

    /** Aggregate metrics. */
    aggregateMetrics: AggregateMetrics;

    /** Configuration used. */
    config?: EvalConfig;

    /** Free-form metadata, keyed by string. */
    metadata?: Record<string, unknown>;
}

Properties

runId: string

Run ID

name: string

Run name/description

agentId?: string

Agent or persona being evaluated

personaId?: string

Persona being evaluated (see agentId)

modelId?: string

Model being used

startedAt: string

Timestamp at which the run started

completedAt?: string

Timestamp at which the run completed

status: "completed" | "failed" | "pending" | "running"

Current status of the run

results: EvalTestResult[]

Individual test results

aggregateMetrics: AggregateMetrics

Aggregate metrics

config?: EvalConfig

Configuration used

metadata?: Record<string, unknown>

Additional free-form metadata attached to the run