will-maclean
diff --git a/‎.github/workflows/cov.yml‎
Lines changed: 11 additions & 3 deletions b/‎.github/workflows/cov.yml‎
Lines changed: 11 additions & 3 deletions
diff --git a/‎.github/workflows/rust.yml‎
Lines changed: 9 additions & 1 deletion b/‎.github/workflows/rust.yml‎
Lines changed: 9 additions & 1 deletion
diff --git a/‎Cargo.lock‎
Lines changed: 1 addition & 0 deletions b/‎Cargo.lock‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎Cargo.toml‎
Lines changed: 8 additions & 1 deletion b/‎Cargo.toml‎
Lines changed: 8 additions & 1 deletion
diff --git a/‎examples/dqn_cartpole.rs‎
Lines changed: 25 additions & 10 deletions b/‎examples/dqn_cartpole.rs‎
Lines changed: 25 additions & 10 deletions
diff --git a/‎examples/dqn_gridworld.rs‎
Lines changed: 21 additions & 9 deletions b/‎examples/dqn_gridworld.rs‎
Lines changed: 21 additions & 9 deletions
diff --git a/‎examples/dqn_mountaincar.rs‎
Lines changed: 21 additions & 9 deletions b/‎examples/dqn_mountaincar.rs‎
Lines changed: 21 additions & 9 deletions
diff --git a/‎examples/dqn_probe1.rs‎
Lines changed: 22 additions & 9 deletions b/‎examples/dqn_probe1.rs‎
Lines changed: 22 additions & 9 deletions
diff --git a/‎examples/dqn_probe2.rs‎
Lines changed: 24 additions & 9 deletions b/‎examples/dqn_probe2.rs‎
Lines changed: 24 additions & 9 deletions
@@ -1,6 +1,12 @@
 name: Coverage
 
-on: [pull_request, push]
+on: 
+  pull_request:
+    branches:
+      - main
+  push:
+    branches:
+      - main
 
 jobs:
   coverage:
@@ -9,15 +15,17 @@ jobs:
       CARGO_TERM_COLOR: always
     steps:
       - uses: actions/checkout@v4
+      - name: Install system deps  # refresh the package index first: hosted runner images can carry stale lists, which makes installs fail
+        run: sudo apt-get update && sudo apt-get install -y pkg-config libfreetype6-dev libfontconfig1-dev
       - name: Install Rust
         run: rustup update stable
       - name: Install cargo-llvm-cov
         uses: taiki-e/install-action@cargo-llvm-cov
       - name: Generate code coverage
-        run: cargo llvm-cov --all-features --workspace --lcov --output-path lcov.info
+        run: cargo llvm-cov --workspace --lcov --output-path lcov.info
       - name: Upload coverage to Codecov
         uses: codecov/codecov-action@v3
         with:
           token: ${{ secrets.CODECOV_TOKEN }}
           files: lcov.info
-          fail_ci_if_error: true
+          fail_ci_if_error: true
@@ -1,13 +1,21 @@
 name: Continuous Integration
 
-on: [push, pull_request]
+on: 
+  pull_request:
+    branches:
+      - main
+  push:
+    branches:
+      - main
 
 jobs:
   build_and_test:
     runs-on: ubuntu-latest
 
     steps:
       - uses: actions/checkout@v2
+      - name: Install system deps  # refresh the package index first: hosted runner images can carry stale lists, which makes installs fail
+        run: sudo apt-get update && sudo apt-get install -y pkg-config libfreetype6-dev libfontconfig1-dev
       - name: ⚡ Cache
         uses: actions/cache@v4
         with:
 
@@ -3,9 +3,16 @@ name = "sb3-burn"
 version = "0.1.0"
 edition = "2021"
 
+[features]
+default = ["ndarray", "wgpu", "sb3-tch"]
+sb3-tch = ["burn/tch", "tch"]
+ndarray = ["burn/ndarray"]
+wgpu = ["burn/wgpu"]
+
 [dependencies]
 assert_approx_eq = "1.1.0"
-burn = { version = "0.19.0", features = ["ndarray", "wgpu", "autodiff", "train", "tch"]}
+burn = { version = "0.19.0", features = ["autodiff", "train"]}
+tch = {version="0.22.0", optional=true}
 csv = "1.3.0"
 dyn-clone = "1.0.17"
 indicatif = "0.17.8"
 
@@ -1,10 +1,6 @@
 use std::path::PathBuf;
 
-use burn::{
-    backend::{libtorch::LibTorchDevice, Autodiff, LibTorch},
-    grad_clipping::GradientClippingConfig,
-    optim::AdamConfig,
-};
+use burn::{backend::Autodiff, grad_clipping::GradientClippingConfig, optim::AdamConfig};
 use sb3_burn::{
     common::{
         algorithm::{OfflineAlgParams, OfflineTrainer},
@@ -17,16 +13,35 @@ use sb3_burn::{
     env::{base::Env, classic_control::cartpole::CartpoleEnv},
 };
 
+#[cfg(feature = "sb3-tch")]
+use burn::backend::{libtorch::LibTorchDevice, LibTorch};
+#[cfg(not(feature = "sb3-tch"))]
+use burn::backend::{wgpu::WgpuDevice, Wgpu};
+
+#[cfg(not(feature = "sb3-tch"))]
+type B = Autodiff<Wgpu>;
+#[cfg(feature = "sb3-tch")]
+type B = Autodiff<LibTorch>;
+
 extern crate sb3_burn;
 
 fn main() {
     // Using parameters from:
     // https://github.com/DLR-RM/rl-baselines3-zoo/blob/master/hyperparams/dqn.yml
 
-    type TrainDevice = Autodiff<LibTorch>;
-    let train_device = LibTorchDevice::Cuda(0);
+    #[cfg(feature = "sb3-tch")]
+    let train_device = if tch::utils::has_cuda() {
+        println!("Using LibTorch (GPU)");
+        LibTorchDevice::Cuda(0)
+    } else {
+        println!("Using LibTorch (CPU)");
+        LibTorchDevice::Cpu
+    };
+
+    #[cfg(not(feature = "sb3-tch"))]
+    let train_device = WgpuDevice::default();
 
-    sb3_seed::<TrainDevice>(1234, &train_device);
+    sb3_seed::<B>(1234, &train_device);
 
     let config_optimizer =
         AdamConfig::new().with_grad_clipping(Some(GradientClippingConfig::Norm(10.0)));
@@ -46,7 +61,7 @@ fn main() {
         .with_train_every(256);
 
     let env = CartpoleEnv::new(500);
-    let q: LinearAdvDQNNet<TrainDevice> = LinearAdvDQNNet::init(
+    let q: LinearAdvDQNNet<B> = LinearAdvDQNNet::init(
         &train_device,
         env.observation_space().shape().len(),
         env.action_space().shape(),
@@ -86,7 +101,7 @@ fn main() {
         buffer,
         Box::new(logger),
         None,
-        EvalConfig::new().with_n_eval_episodes(100),
+        EvalConfig::new().with_n_eval_episodes(5),
         &train_device,
     );
 
 
@@ -1,10 +1,6 @@
 use std::path::PathBuf;
 
-use burn::{
-    backend::{libtorch::LibTorchDevice, Autodiff, LibTorch},
-    grad_clipping::GradientClippingConfig,
-    optim::AdamConfig,
-};
+use burn::{backend::Autodiff, grad_clipping::GradientClippingConfig, optim::AdamConfig};
 use sb3_burn::{
     common::{
         algorithm::{OfflineAlgParams, OfflineTrainer},
@@ -17,17 +13,33 @@ use sb3_burn::{
     env::{base::Env, gridworld::GridWorldEnv},
 };
 
+#[cfg(feature = "sb3-tch")]
+use burn::backend::{libtorch::LibTorchDevice, LibTorch};
+#[cfg(not(feature = "sb3-tch"))]
+use burn::backend::{wgpu::WgpuDevice, Wgpu};
+
+#[cfg(not(feature = "sb3-tch"))]
+type B = Autodiff<Wgpu>;
+#[cfg(feature = "sb3-tch")]
+type B = Autodiff<LibTorch>;
+
 extern crate sb3_burn;
 
 fn main() {
     // Using parameters from:
     // https://github.com/DLR-RM/rl-baselines3-zoo/blob/master/hyperparams/dqn.yml
 
-    type TrainingBacked = Autodiff<LibTorch>;
+    #[cfg(feature = "sb3-tch")]
+    let train_device = if tch::utils::has_cuda() {
+        LibTorchDevice::Cuda(0)
+    } else {
+        LibTorchDevice::Cpu
+    };
 
-    let train_device = LibTorchDevice::Cuda(0);
+    #[cfg(not(feature = "sb3-tch"))]
+    let train_device = WgpuDevice::default();
 
-    sb3_seed::<TrainingBacked>(1234, &train_device);
+    sb3_seed::<B>(1234, &train_device);
 
     let config_optimizer =
         AdamConfig::new().with_grad_clipping(Some(GradientClippingConfig::Norm(10.0)));
@@ -40,7 +52,7 @@ fn main() {
         .with_lr(1e-3);
 
     let env = GridWorldEnv::default();
-    let q = LinearAdvDQNNet::<TrainingBacked>::init(
+    let q = LinearAdvDQNNet::<B>::init(
         &train_device,
         env.observation_space().shape().len(),
         env.action_space().shape(),
 
@@ -1,10 +1,6 @@
 use std::path::PathBuf;
 
-use burn::{
-    backend::{libtorch::LibTorchDevice, Autodiff, LibTorch},
-    grad_clipping::GradientClippingConfig,
-    optim::AdamConfig,
-};
+use burn::{backend::Autodiff, grad_clipping::GradientClippingConfig, optim::AdamConfig};
 use sb3_burn::{
     common::{
         algorithm::{OfflineAlgParams, OfflineTrainer},
@@ -17,17 +13,33 @@ use sb3_burn::{
     env::{base::Env, classic_control::mountain_car::MountainCarEnv},
 };
 
+#[cfg(feature = "sb3-tch")]
+use burn::backend::{libtorch::LibTorchDevice, LibTorch};
+#[cfg(not(feature = "sb3-tch"))]
+use burn::backend::{wgpu::WgpuDevice, Wgpu};
+
+#[cfg(not(feature = "sb3-tch"))]
+type B = Autodiff<Wgpu>;
+#[cfg(feature = "sb3-tch")]
+type B = Autodiff<LibTorch>;
+
 extern crate sb3_burn;
 
 fn main() {
     // Using parameters from:
     // https://github.com/DLR-RM/rl-baselines3-zoo/blob/master/hyperparams/dqn.yml
 
-    type TrainingBacked = Autodiff<LibTorch>;
+    #[cfg(feature = "sb3-tch")]
+    let train_device = if tch::utils::has_cuda() {
+        LibTorchDevice::Cuda(0)
+    } else {
+        LibTorchDevice::Cpu
+    };
 
-    let train_device = LibTorchDevice::Cuda(0);
+    #[cfg(not(feature = "sb3-tch"))]
+    let train_device = WgpuDevice::default();
 
-    sb3_seed::<TrainingBacked>(1234, &train_device);
+    sb3_seed::<B>(1234, &train_device);
 
     let config_optimizer =
         AdamConfig::new().with_grad_clipping(Some(GradientClippingConfig::Norm(10.0)));
@@ -46,7 +58,7 @@ fn main() {
         .with_train_every(16);
 
     let env = MountainCarEnv::default();
-    let q = LinearAdvDQNNet::<TrainingBacked>::init(
+    let q = LinearAdvDQNNet::<B>::init(
         &train_device,
         env.observation_space().shape().len(),
         env.action_space().shape(),
 
@@ -1,10 +1,6 @@
 use std::path::PathBuf;
 
-use burn::{
-    backend::{libtorch::LibTorchDevice, Autodiff, LibTorch},
-    grad_clipping::GradientClippingConfig,
-    optim::AdamConfig,
-};
+use burn::{backend::Autodiff, grad_clipping::GradientClippingConfig, optim::AdamConfig};
 use sb3_burn::{
     common::{
         algorithm::{OfflineAlgParams, OfflineTrainer},
@@ -17,16 +13,33 @@ use sb3_burn::{
     env::{base::Env, probe::ProbeEnvValueTest},
 };
 
+#[cfg(feature = "sb3-tch")]
+use burn::backend::{libtorch::LibTorchDevice, LibTorch};
+#[cfg(not(feature = "sb3-tch"))]
+use burn::backend::{wgpu::WgpuDevice, Wgpu};
+
+#[cfg(not(feature = "sb3-tch"))]
+type B = Autodiff<Wgpu>;
+#[cfg(feature = "sb3-tch")]
+type B = Autodiff<LibTorch>;
+
 extern crate sb3_burn;
 
 fn main() {
     // Using parameters from:
     // https://github.com/DLR-RM/rl-baselines3-zoo/blob/master/hyperparams/dqn.yml
 
-    type TrainBackend = Autodiff<LibTorch>;
-    let train_device = LibTorchDevice::default();
+    #[cfg(feature = "sb3-tch")]
+    let train_device = if tch::utils::has_cuda() {
+        LibTorchDevice::Cuda(0)
+    } else {
+        LibTorchDevice::Cpu
+    };
+
+    #[cfg(not(feature = "sb3-tch"))]
+    let train_device = WgpuDevice::default();
 
-    sb3_seed::<TrainBackend>(1234, &train_device);
+    sb3_seed::<B>(1234, &train_device);
 
     let config_optimizer =
         AdamConfig::new().with_grad_clipping(Some(GradientClippingConfig::Norm(10.0)));
@@ -42,7 +55,7 @@ fn main() {
         .with_evaluate_during_training(false);
 
     let env = ProbeEnvValueTest::default();
-    let q: LinearDQNNet<TrainBackend> = LinearDQNNet::init(
+    let q: LinearDQNNet<B> = LinearDQNNet::init(
         &train_device,
         env.observation_space().shape().len(),
         env.action_space().shape(),
 
@@ -1,10 +1,6 @@
 use std::path::PathBuf;
 
-use burn::{
-    backend::{libtorch::LibTorchDevice, Autodiff, LibTorch},
-    grad_clipping::GradientClippingConfig,
-    optim::AdamConfig,
-};
+use burn::{backend::Autodiff, grad_clipping::GradientClippingConfig, optim::AdamConfig};
 use sb3_burn::{
     common::{
         algorithm::{OfflineAlgParams, OfflineTrainer},
@@ -17,14 +13,33 @@ use sb3_burn::{
     env::{base::Env, probe::ProbeEnvBackpropTest},
 };
 
+#[cfg(feature = "sb3-tch")]
+use burn::backend::{libtorch::LibTorchDevice, LibTorch};
+#[cfg(not(feature = "sb3-tch"))]
+use burn::backend::{wgpu::WgpuDevice, Wgpu};
+
+#[cfg(not(feature = "sb3-tch"))]
+type B = Autodiff<Wgpu>;
+#[cfg(feature = "sb3-tch")]
+type B = Autodiff<LibTorch>;
+
 extern crate sb3_burn;
 
 fn main() {
     // Using parameters from:
     // https://github.com/DLR-RM/rl-baselines3-zoo/blob/master/hyperparams/dqn.yml
-    type TrainBackend = Autodiff<LibTorch>;
-    let train_device = LibTorchDevice::default();
-    sb3_seed::<TrainBackend>(1234, &train_device);
+
+    #[cfg(feature = "sb3-tch")]
+    let train_device = if tch::utils::has_cuda() {
+        LibTorchDevice::Cuda(0)
+    } else {
+        LibTorchDevice::Cpu
+    };
+
+    #[cfg(not(feature = "sb3-tch"))]
+    let train_device = WgpuDevice::default();
+
+    sb3_seed::<B>(1234, &train_device);
 
     let config_optimizer =
         AdamConfig::new().with_grad_clipping(Some(GradientClippingConfig::Norm(10.0)));
@@ -40,7 +55,7 @@ fn main() {
         .with_evaluate_during_training(false);
 
     let env = ProbeEnvBackpropTest::default();
-    let q: LinearDQNNet<TrainBackend> = LinearDQNNet::init(
+    let q: LinearDQNNet<B> = LinearDQNNet::init(
         &train_device,
         env.observation_space().shape(),
         env.action_space().shape(),