use anyhow::Result;
use border_atari_env::{
BorderAtariAct, BorderAtariActRawFilter, BorderAtariEnv, BorderAtariEnvConfig, BorderAtariObs,
BorderAtariObsRawFilter,
};
use border_core::{
Agent, Configurable, DefaultEvaluator, Env as _, Evaluator, NullReplayBuffer, Policy,
};
use serde::Deserialize;
type Obs = BorderAtariObs;
type Act = BorderAtariAct;
type ObsFilter = BorderAtariObsRawFilter<Obs>;
type ActFilter = BorderAtariActRawFilter<Act>;
type EnvConfig = BorderAtariEnvConfig<Obs, Act, ObsFilter, ActFilter>;
type Env = BorderAtariEnv<Obs, Act, ObsFilter, ActFilter>;
#[derive(Clone, Deserialize)]
struct RandomPolicyConfig {
pub n_acts: usize,
}
struct RandomPolicy {
n_acts: usize,
}
impl Policy<Env> for RandomPolicy {
fn sample(&mut self, _: &Obs) -> Act {
fastrand::u8(..self.n_acts as u8).into()
}
}
impl Agent<Env, NullReplayBuffer> for RandomPolicy {}
impl Configurable for RandomPolicy {
type Config = RandomPolicyConfig;
fn build(config: Self::Config) -> Self {
Self {
n_acts: config.n_acts,
}
}
}
fn env_config(name: String) -> EnvConfig {
EnvConfig::default().name(name)
}
fn main() -> Result<()> {
env_logger::Builder::from_env(env_logger::Env::default().default_filter_or("info")).init();
fastrand::seed(42);
let env_config = env_config("pong".to_string()).render(true);
let mut policy = {
let policy_config = {
let n_acts = {
let env = Env::build(&env_config, 42)?;
env.get_num_actions_atari()
};
RandomPolicyConfig {
n_acts: n_acts as _,
}
};
Box::new(RandomPolicy::build(policy_config)) as _
};
let env_config = env_config.render(true);
let _ = DefaultEvaluator::new(&env_config, 42, 5)?.evaluate(&mut policy);
Ok(())
}