# Crate manifest for `agentic-eval`.
# Key order: name, version, remaining keys alphabetically, description last.
[package]
name = "agentic-eval"
version = "0.14.2"
authors = ["NERVOSYS <opensource@nervosys.ai>"]
categories = ["development-tools", "text-processing"]
documentation = "https://docs.rs/agentic-eval"
edition = "2021"
# The crate's own directory inside the repository named by `repository`.
homepage = "https://github.com/nervosys/AetherShell/tree/master/crates/agentic-eval"
keywords = ["llm", "agent", "tokens", "determinism", "safety"]
license = "AGPL-3.0-or-later"
readme = "README.md"
repository = "https://github.com/nervosys/AetherShell"
# Minimum supported Rust version.
rust-version = "1.75"
# Folded with line-ending backslashes: the parsed value is one line with no
# embedded newlines. Keep the single space before each trailing backslash.
description = """\
Evaluate programs, CLI commands, programming languages, AI frameworks, \
and VM/sandbox systems for agentic AI use across four axes — token \
efficiency, determinism, reliability, and safety — under popular \
tokenizers (OpenAI GPT-4/GPT-4o, Anthropic Claude). Includes a CLI effect \
classifier, curated language/framework/VM profiles, and a self-describing \
ontology.\
"""

# docs.rs build settings: document the crate with every feature enabled so
# feature-gated items appear in the published docs.
[package.metadata.docs.rs]
all-features = true
# Opt-in functionality. Nothing is enabled by default; each feature below
# switches on the optional dependency of the matching name in [dependencies].
[features]
default = []
# Pulls in the optional `tiktoken-rs` dependency.
real-tokens = ["dep:tiktoken-rs"]
# Pulls in the optional `serde` dependency (declared with its `derive` feature).
serde = ["dep:serde"]

# Every dependency is optional and only built when its feature is requested.
[dependencies]
serde = { version = "1", optional = true, features = ["derive"] }
tiktoken-rs = { version = "0.6", optional = true }
# Example targets, declared explicitly with their source paths.
# NOTE(review): no `required-features` is set on any example; if one of them
# depends on `real-tokens` or `serde`, it should declare that here. Confirm
# against the example sources.

# examples/evaluate.rs
[[example]]
name = "evaluate"
path = "examples/evaluate.rs"

# examples/vm_benchmark.rs
[[example]]
name = "vm_benchmark"
path = "examples/vm_benchmark.rs"

# examples/web_benchmark.rs
[[example]]
name = "web_benchmark"
path = "examples/web_benchmark.rs"