trictrac/bot/src/burnrl/main.rs

61 lines
2 KiB
Rust

use bot::burnrl::{dqn_model, environment, utils::demo_model};
use burn::backend::{ndarray::NdArrayDevice, Autodiff, NdArray};
use burn::module::Module;
use burn::record::{CompactRecorder, Recorder};
use burn_rl::agent::DQN;
use burn_rl::base::{Action, Agent, ElemType, Environment, State};
type Backend = Autodiff<NdArray<ElemType>>;
type Env = environment::TrictracEnvironment;
fn main() {
println!("> Entraînement");
let num_episodes = 3;
let agent = dqn_model::run::<Env, Backend>(num_episodes, false); //true);
println!("> Sauvegarde du modèle de validation");
save_model(agent.model().as_ref().unwrap());
println!("> Chargement du modèle pour test");
let loaded_model = load_model();
let loaded_agent = DQN::new(loaded_model);
println!("> Test avec le modèle chargé");
demo_model(loaded_agent, |env| env.valid_actions());
}
fn save_model(model: &dqn_model::Net<NdArray<ElemType>>) {
let path = "models/burn_dqn".to_string();
let recorder = CompactRecorder::new();
let model_path = format!("{}_model.burn", path);
println!("Modèle de validation sauvegardé : {}", model_path);
recorder
.record(model.clone().into_record(), model_path.into())
.unwrap();
}
fn load_model() -> dqn_model::Net<NdArray<ElemType>> {
// TODO : reprendre le DENSE_SIZE de dqn_model.rs
const DENSE_SIZE: usize = 128;
let path = "models/burn_dqn".to_string();
let model_path = format!("{}_model.burn", path);
println!("Chargement du modèle depuis : {}", model_path);
let device = NdArrayDevice::default();
let recorder = CompactRecorder::new();
let record = recorder
.load(model_path.into(), &device)
.expect("Impossible de charger le modèle");
dqn_model::Net::new(
<environment::TrictracEnvironment as Environment>::StateType::size(),
DENSE_SIZE,
<environment::TrictracEnvironment as Environment>::ActionType::size(),
&device,
)
.load_record(record)
}