agentcarousel 0.8.0

Unit tests for AI agents. Run behavioral tests in CI, score with an LLM judge, and export signed evidence your auditors accept.
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
//! Shared domain types for fixtures, runs, traces, and metrics, plus [`CoreError`],
//! [`judge_provider`] helpers for LLM-backed judges, [`model_pricing`] cost helpers, and
//! [`retry`] backoff helpers.

// Internal helper module: `pub(crate)` keeps it out of the public API.
pub(crate) mod hex_util;
// Public modules: reachable by path as well as through the re-exports below.
pub mod judge_provider;
pub mod model_pricing;
pub mod models;
pub mod retry;

// Re-exports at this module's top level so callers can name these items without spelling
// out the submodule path.
pub use judge_provider::{judge_key_candidates, judge_provider_from_model, JudgeProvider};
pub use model_pricing::{
    annotate_run_cost, fmt_cost, fmt_tokens, lookup_pricing, prefetch_pricing, ModelPricing,
};
// Glob re-export: every public item of `models` is surfaced here, so adding a public item
// to `models` also widens this module's API.
// NOTE(review): `CoreError`, referenced in the file-level docs, presumably comes from
// `models` — confirm.
pub use models::*;
pub use retry::{compute_backoff_ms, is_retryable_status, retry_policy, RetryPolicy};