Struct EvalRunner

Source

pub struct EvalRunner { /* private fields */ }

Expand description

Evaluation runner using Orchestrator directly

§Example

let runner = EvalRunner::new(scenario, runtime.handle().clone())
    .with_runs(5)
    .with_seed(42)
    .with_task(SwarmTask::new("Find the auth handler"))
    .with_manager_factory(|| Box::new(MyManager::new()))
    .with_batch_invoker_factory(|| Box::new(MyInvoker::new()));

let report = runner.run()?;

Implementations§

Source §

impl EvalRunner

Source

pub fn new(scenario: EvalScenario, runtime: Handle) -> Self

Source

pub fn with_verbose(self, verbose: bool) -> Self

Enable verbose output (print tick snapshots)

Source

pub fn with_exploration(self, enable: bool) -> Self

Enable ExplorationSpace tracking

Source

pub fn with_dependency_graph(self, graph: DependencyGraph) -> Self

Set dependency graph for action sequencing

The graph defines valid action transitions and terminal conditions. When set, actions will be filtered based on the graph structure.

Source

pub fn with_learning_store(self, path: impl AsRef<Path>) -> Self

Enable LearningStore for cross-session learning

When enabled, statistics will be saved after each run and loaded as prior for subsequent runs. This enables incremental learning across sessions.

§Example

runner.with_learning_store("~/.swarm-engine/learning")

Source

pub fn with_train_trigger(self, trigger: Arc<dyn TrainTrigger>) -> Self

Set TrainTrigger for Learning

Controls when offline learning is executed after eval runs. Default: Learn after every run (if learning_store is configured).

§Example

use swarm_engine_core::learn::CountTrigger;

// Run learning after every 5 eval iterations
runner.with_train_trigger(Arc::new(CountTrigger::new(5)))

Source

pub fn skip_learned_action_order(self, skip: bool) -> Self

Skip learned action order from offline model

When enabled, the learned dependency graph (action_order) from the offline model will not be applied. This is useful for testing without learned priors.

Source

pub fn with_trace_subscriber(self, subscriber: Arc<dyn TraceSubscriber>) -> Self

Set trace subscriber for ActionEvent output

The subscriber will receive all ActionEvents during evaluation. Use InMemoryTraceSubscriber to collect events and dump them after evaluation, or JsonlTraceSubscriber for real-time output.

§Example

use std::sync::Arc;
use swarm_engine_core::events::InMemoryTraceSubscriber;

let trace = Arc::new(InMemoryTraceSubscriber::new());
runner.with_trace_subscriber(trace.clone());
// ... run evaluation ...
trace.dump_to_file("trace.jsonl")?;

Source

pub fn with_scenario_profile(self, profile: ScenarioProfile) -> Self

Apply a ScenarioProfile to use learned exploration parameters and strategies

This converts the profile to an OfflineModel and applies it during execution. When set, the profile’s learned components (exploration params, strategy config, action order) will be used instead of defaults.

§Example

let store = ProfileStore::new("~/.swarm-engine/profiles")?;
let profile = store.load("troubleshooting")?;
runner.with_scenario_profile(profile);

Source

pub fn with_runs(self, runs: usize) -> Self

Source

pub fn with_seed(self, seed: u64) -> Self

Source

pub fn with_task(self, task: SwarmTask) -> Self

Set the task to execute

Source

pub fn with_manager_factory<F>(self, factory: F) -> Self
where F: Fn() -> Box<dyn ManagerAgent> + Send + Sync + 'static,

Set manager factory (creates new Manager for each run)

Source

pub fn with_batch_invoker_factory<F>(self, factory: F) -> Self
where F: Fn() -> Box<dyn BatchInvoker> + Send + Sync + 'static,

Set batch invoker factory (creates new BatchInvoker for each run)

Source

pub fn with_extensions_factory<F>(self, factory: F) -> Self
where F: Fn() -> Extensions + Send + Sync + 'static,

Set extensions factory (creates new Extensions for each run)

Source

pub fn with_operator_provider_factory<F>(self, factory: F) -> Self
where F: Fn() -> Box<dyn OperatorProvider<NodeRules>> + Send + Sync + 'static,

Set OperatorProvider factory (creates new provider for each run)

Use this to configure the Selection strategy for exploration. Default is AdaptiveProvider if not specified.

§Example

use swarm_engine_core::exploration::{HybridLlmProvider, ReviewPolicy};
use swarm_engine_llm::LlmStrategyAdvisor;

runner.with_operator_provider_factory(|| {
    let advisor = LlmStrategyAdvisor::new(decider.clone(), handle.clone());
    let policy = ReviewPolicy::default();
    Box::new(HybridLlmProvider::new(advisor, policy))
})

Source

pub fn run(&self) -> Result<EvalReport>

Auto Trait Implementations§

§

impl !UnwindSafe for EvalRunner

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T> Instrument for T

Source §

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

Source §

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

Source §

impl<T, U> Into for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> Pointable for T

Source §

const ALIGN: usize

The alignment of pointer.

Source §

type Init = T

The type for initializers.

Source §

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a with the given initializer. Read more

Source §

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

Source §

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

Source §

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

Source §

impl<T> PolicyExt for T
where T: ?Sized,

Source §

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more

Source §

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more

Source §

impl<T, U> TryFrom for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto for T
where U: TryFrom<T>,

Source §

type Error = >::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, >::Error>

Performs the conversion.

Source §

impl<T> WithSubscriber for T

Source §

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

Source §

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

EvalRunner

Struct EvalRunner Copy item path

§Example

Implementations§

impl EvalRunner

pub fn new(scenario: EvalScenario, runtime: Handle) -> Self

pub fn with_verbose(self, verbose: bool) -> Self

pub fn with_exploration(self, enable: bool) -> Self

pub fn with_dependency_graph(self, graph: DependencyGraph) -> Self

pub fn with_learning_store(self, path: impl AsRef<Path>) -> Self

§Example

pub fn with_train_trigger(self, trigger: Arc<dyn TrainTrigger>) -> Self

§Example

pub fn skip_learned_action_order(self, skip: bool) -> Self

pub fn with_trace_subscriber(self, subscriber: Arc<dyn TraceSubscriber>) -> Self

§Example

pub fn with_scenario_profile(self, profile: ScenarioProfile) -> Self

§Example

pub fn with_runs(self, runs: usize) -> Self

pub fn with_seed(self, seed: u64) -> Self

pub fn with_task(self, task: SwarmTask) -> Self

pub fn with_manager_factory<F>(self, factory: F) -> Selfwhere F: Fn() -> Box<dyn ManagerAgent> + Send + Sync + 'static,

pub fn with_batch_invoker_factory<F>(self, factory: F) -> Selfwhere F: Fn() -> Box<dyn BatchInvoker> + Send + Sync + 'static,

pub fn with_extensions_factory<F>(self, factory: F) -> Selfwhere F: Fn() -> Extensions + Send + Sync + 'static,

pub fn with_operator_provider_factory<F>(self, factory: F) -> Selfwhere F: Fn() -> Box<dyn OperatorProvider<NodeRules>> + Send + Sync + 'static,

§Example

pub fn run(&self) -> Result<EvalReport>

Auto Trait Implementations§

impl Freeze for EvalRunner

impl !RefUnwindSafe for EvalRunner

impl Send for EvalRunner

impl Sync for EvalRunner

impl Unpin for EvalRunner

impl !UnwindSafe for EvalRunner

Blanket Implementations§

impl<T> Any for Twhere T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for Twhere T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for Twhere T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for Twhere U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for Twhere T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>where T: Policy<B, E>, P: Policy<B, E>,

impl<T, U> TryFrom<U> for Twhere U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for Twhere U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct EvalRunner

pub fn with_manager_factory<F>(self, factory: F) -> Self
where F: Fn() -> Box<dyn ManagerAgent> + Send + Sync + 'static,

pub fn with_batch_invoker_factory<F>(self, factory: F) -> Self
where F: Fn() -> Box<dyn BatchInvoker> + Send + Sync + 'static,

pub fn with_extensions_factory<F>(self, factory: F) -> Self
where F: Fn() -> Extensions + Send + Sync + 'static,

pub fn with_operator_provider_factory<F>(self, factory: F) -> Self
where F: Fn() -> Box<dyn OperatorProvider<NodeRules>> + Send + Sync + 'static,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,