diff --git a/burn-book/src/advanced/backend-extension/custom-wgpu-kernel.md b/burn-book/src/advanced/backend-extension/custom-wgpu-kernel.md index f82054bbfc..e494dcd2fd 100644 --- a/burn-book/src/advanced/backend-extension/custom-wgpu-kernel.md +++ b/burn-book/src/advanced/backend-extension/custom-wgpu-kernel.md @@ -194,7 +194,7 @@ impl DynamicKernel for FusedMatmulAddRelu { ``` Subsequently, we'll go into implementing our custom backend trait for the WGPU backend. -Note that we won't go into supporting the `fusion` feature flag in this tutorial, so +Note that we won't go into supporting the `fusion` feature flag in this tutorial, so we implement the trait for the raw `WgpuBackend` type. ```rust, ignore diff --git a/burn-book/src/basic-workflow/data.md b/burn-book/src/basic-workflow/data.md index 44a778143c..01e8701fc4 100644 --- a/burn-book/src/basic-workflow/data.md +++ b/burn-book/src/basic-workflow/data.md @@ -16,15 +16,15 @@ at `examples/guide/` [directory](https://github.com/tracel-ai/burn/tree/main/exa ```rust , ignore use burn::{ - data::{dataloader::batcher::Batcher, dataset::vision::MNISTItem}, + data::{dataloader::batcher::Batcher, dataset::vision::MnistItem}, tensor::{backend::Backend, Data, ElementConversion, Int, Tensor}, }; -pub struct MNISTBatcher { +pub struct MnistBatcher { device: B::Device, } -impl MNISTBatcher { +impl MnistBatcher { pub fn new(device: B::Device) -> Self { Self { device } } @@ -42,13 +42,13 @@ Next, we need to actually implement the batching logic. ```rust , ignore #[derive(Clone, Debug)] -pub struct MNISTBatch { +pub struct MnistBatch { pub images: Tensor, pub targets: Tensor, } -impl Batcher> for MNISTBatcher { - fn batch(&self, items: Vec) -> MNISTBatch { +impl Batcher> for MnistBatcher { + fn batch(&self, items: Vec) -> MnistBatch { let images = items .iter() .map(|item| Data::::from(item.image)) @@ -71,7 +71,7 @@ impl Batcher> for MNISTBatcher { let images = Tensor::cat(images, 0).to_device(&self.device); let targets = Tensor::cat(targets, 0).to_device(&self.device); - MNISTBatch { images, targets } + MnistBatch { images, targets } } } ``` @@ -81,7 +81,7 @@ impl Batcher> for MNISTBatcher { The iterator pattern allows you to perform some tasks on a sequence of items in turn. -In this example, an iterator is created over the `MNISTItem`s in the vector `items` by calling the +In this example, an iterator is created over the `MnistItem`s in the vector `items` by calling the `iter` method. _Iterator adaptors_ are methods defined on the `Iterator` trait that produce different iterators by @@ -100,7 +100,7 @@ If we go back to the example, we can break down and comment the expression used images. ```rust, ignore -let images = items // take items Vec +let images = items // take items Vec .iter() // create an iterator over it .map(|item| Data::::from(item.image)) // for each item, convert the image to float32 data struct .map(|data| Tensor::::from_data(data.convert(), &self.device)) // for each data struct, create a tensor on the device @@ -115,8 +115,8 @@ Book.
-In the previous example, we implement the `Batcher` trait with a list of `MNISTItem` as input and a -single `MNISTBatch` as output. The batch contains the images in the form of a 3D tensor, along with +In the previous example, we implement the `Batcher` trait with a list of `MnistItem` as input and a +single `MnistBatch` as output. The batch contains the images in the form of a 3D tensor, along with a targets tensor that contains the indexes of the correct digit class. The first step is to parse the image array into a `Data` struct. Burn provides the `Data` struct to encapsulate tensor storage information without being specific for a backend. When creating a tensor from data, we often need to diff --git a/burn-book/src/basic-workflow/inference.md b/burn-book/src/basic-workflow/inference.md index 40851192b6..ad2a893ea7 100644 --- a/burn-book/src/basic-workflow/inference.md +++ b/burn-book/src/basic-workflow/inference.md @@ -16,7 +16,7 @@ impl ModelConfig { conv1: Conv2dConfig::new([1, 8], [3, 3]).init_with(record.conv1), conv2: Conv2dConfig::new([8, 16], [3, 3]).init_with(record.conv2), pool: AdaptiveAvgPool2dConfig::new([8, 8]).init(), - activation: ReLU::new(), + activation: Relu::new(), linear1: LinearConfig::new(16 * 8 * 8, self.hidden_size).init_with(record.linear1), linear2: LinearConfig::new(self.hidden_size, self.num_classes) .init_with(record.linear2), @@ -33,7 +33,7 @@ manually. Everything is validated when loading the model with the record. Now let's create a simple `infer` method in a new file `src/inference.rs` which we will use to load our trained model. ```rust , ignore -pub fn infer(artifact_dir: &str, device: B::Device, item: MNISTItem) { +pub fn infer(artifact_dir: &str, device: B::Device, item: MnistItem) { let config = TrainingConfig::load(format!("{artifact_dir}/config.json")) .expect("Config should exist for the model"); let record = CompactRecorder::new() @@ -43,7 +43,7 @@ pub fn infer(artifact_dir: &str, device: B::Device, item: MNISTItem) let model = config.model.init_with::(record); let label = item.label; - let batcher = MNISTBatcher::new(device); + let batcher = MnistBatcher::new(device); let batch = batcher.batch(vec![item]); let output = model.forward(batch.images); let predicted = output.argmax(1).flatten::<1>(0, 1).into_scalar(); @@ -56,6 +56,6 @@ The first step is to load the configuration of the training to fetch the correct configuration. Then we can fetch the record using the same recorder as we used during training. Finally we can init the model with the configuration and the record before sending it to the wanted device for inference. For simplicity we can use the same batcher used during the training to pass -from a MNISTItem to a tensor. +from a MnistItem to a tensor. By running the infer function, you should see the predictions of your model! diff --git a/burn-book/src/basic-workflow/model.md b/burn-book/src/basic-workflow/model.md index 90092a4e80..381f2a5d2f 100644 --- a/burn-book/src/basic-workflow/model.md +++ b/burn-book/src/basic-workflow/model.md @@ -35,7 +35,7 @@ use burn::{ nn::{ conv::{Conv2d, Conv2dConfig}, pool::{AdaptiveAvgPool2d, AdaptiveAvgPool2dConfig}, - Dropout, DropoutConfig, Linear, LinearConfig, ReLU, + Dropout, DropoutConfig, Linear, LinearConfig, Relu, }, tensor::{backend::Backend, Tensor}, }; @@ -48,7 +48,7 @@ pub struct Model { dropout: Dropout, linear1: Linear, linear2: Linear, - activation: ReLU, + activation: Relu, } ``` @@ -98,7 +98,7 @@ There are two major things going on in this code sample. pub struct MyCustomModule { linear1: Linear, linear2: Linear, - activation: ReLU, + activation: Relu, } ``` @@ -178,7 +178,7 @@ impl ModelConfig { conv1: Conv2dConfig::new([1, 8], [3, 3]).init(device), conv2: Conv2dConfig::new([8, 16], [3, 3]).init(device), pool: AdaptiveAvgPool2dConfig::new([8, 8]).init(), - activation: ReLU::new(), + activation: Relu::new(), linear1: LinearConfig::new(16 * 8 * 8, self.hidden_size).init(device), linear2: LinearConfig::new(self.hidden_size, self.num_classes).init(device), dropout: DropoutConfig::new(self.dropout).init(), diff --git a/burn-book/src/basic-workflow/training.md b/burn-book/src/basic-workflow/training.md index afedafdc8a..a015fb2b88 100644 --- a/burn-book/src/basic-workflow/training.md +++ b/burn-book/src/basic-workflow/training.md @@ -43,23 +43,23 @@ Moving forward, we will proceed with the implementation of both the training and for our model. ```rust , ignore -impl TrainStep, ClassificationOutput> for Model { - fn step(&self, batch: MNISTBatch) -> TrainOutput> { +impl TrainStep, ClassificationOutput> for Model { + fn step(&self, batch: MnistBatch) -> TrainOutput> { let item = self.forward_classification(batch.images, batch.targets); TrainOutput::new(self, item.loss.backward(), item) } } -impl ValidStep, ClassificationOutput> for Model { - fn step(&self, batch: MNISTBatch) -> ClassificationOutput { +impl ValidStep, ClassificationOutput> for Model { + fn step(&self, batch: MnistBatch) -> ClassificationOutput { self.forward_classification(batch.images, batch.targets) } } ``` Here we define the input and output types as generic arguments in the `TrainStep` and `ValidStep`. -We will call them `MNISTBatch` and `ClassificationOutput`. In the training step, the computation of +We will call them `MnistBatch` and `ClassificationOutput`. In the training step, the computation of gradients is straightforward, necessitating a simple invocation of `backward()` on the loss. Note that contrary to PyTorch, gradients are not stored alongside each tensor parameter, but are rather returned by the backward pass, as such: `let gradients = loss.backward();`. The gradient of a @@ -81,8 +81,8 @@ which is generic over the `Backend` trait as has been covered before. These trai `burn::train` and define a common `step` method that should be implemented for all structs. Since the trait is generic over the input and output types, the trait implementation must specify the concrete types used. This is where the additional type constraints appear -`, ClassificationOutput>`. As we saw previously, the concrete input type for the -batch is `MNISTBatch`, and the output of the forward pass is `ClassificationOutput`. The `step` +`, ClassificationOutput>`. As we saw previously, the concrete input type for the +batch is `MnistBatch`, and the output of the forward pass is `ClassificationOutput`. The `step` method signature matches the concrete input and output types. For more details specific to constraints on generic types when defining methods, take a look at @@ -118,20 +118,20 @@ pub fn train(artifact_dir: &str, config: TrainingConfig, dev B::seed(config.seed); - let batcher_train = MNISTBatcher::::new(device.clone()); - let batcher_valid = MNISTBatcher::::new(device.clone()); + let batcher_train = MnistBatcher::::new(device.clone()); + let batcher_valid = MnistBatcher::::new(device.clone()); let dataloader_train = DataLoaderBuilder::new(batcher_train) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::train()); + .build(MnistDataset::train()); let dataloader_test = DataLoaderBuilder::new(batcher_valid) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::test()); + .build(MnistDataset::test()); let learner = LearnerBuilder::new(artifact_dir) .metric_train_numeric(AccuracyMetric::new()) diff --git a/burn-book/src/building-blocks/module.md b/burn-book/src/building-blocks/module.md index 1a95813f1e..6a577eb741 100644 --- a/burn-book/src/building-blocks/module.md +++ b/burn-book/src/building-blocks/module.md @@ -160,4 +160,4 @@ Burn comes with built-in modules that you can use to build your own modules. | Burn API | PyTorch Equivalent | | ------------------ | --------------------- | | `CrossEntropyLoss` | `nn.CrossEntropyLoss` | -| `MSELoss` | `nn.MSELoss` | +| `MseLoss` | `nn.MSELoss` | diff --git a/burn-book/src/custom-training-loop.md b/burn-book/src/custom-training-loop.md index 95682987ec..246088eba3 100644 --- a/burn-book/src/custom-training-loop.md +++ b/burn-book/src/custom-training-loop.md @@ -40,21 +40,21 @@ pub fn run(device: &B::Device) { let mut optim = config.optimizer.init(); // Create the batcher. - let batcher_train = MNISTBatcher::::new(device.clone()); - let batcher_valid = MNISTBatcher::::new(device.clone()); + let batcher_train = MnistBatcher::::new(device.clone()); + let batcher_valid = MnistBatcher::::new(device.clone()); // Create the dataloaders. let dataloader_train = DataLoaderBuilder::new(batcher_train) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::train()); + .build(MnistDataset::train()); let dataloader_test = DataLoaderBuilder::new(batcher_valid) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::test()); + .build(MnistDataset::test()); ... } @@ -140,7 +140,7 @@ Note that after each epoch, we include a validation loop to assess our model's p previously unseen data. To disable gradient tracking during this validation step, we can invoke `model.valid()`, which provides a model on the inner backend without autodiff capabilities. It's important to emphasize that we've declared our validation batcher to be on the inner backend, -specifically `MNISTBatcher`; not using `model.valid()` will result in a compilation +specifically `MnistBatcher`; not using `model.valid()` will result in a compilation error. You can find the code above available as an @@ -195,7 +195,7 @@ where M: AutodiffModule, O: Optimizer, { - pub fn step(&mut self, _batch: MNISTBatch) { + pub fn step(&mut self, _batch: MnistBatch) { // } } @@ -214,7 +214,7 @@ the backend and add your trait constraint within its definition: ```rust, ignore #[allow(dead_code)] impl Learner2 { - pub fn step(&mut self, _batch: MNISTBatch) + pub fn step(&mut self, _batch: MnistBatch) where B: AutodiffBackend, M: AutodiffModule, diff --git a/burn-book/src/saving-and-loading.md b/burn-book/src/saving-and-loading.md index 5b784ab50d..d3fdf3b7dc 100644 --- a/burn-book/src/saving-and-loading.md +++ b/burn-book/src/saving-and-loading.md @@ -44,7 +44,7 @@ model definition as a simple example. pub struct Model { linear_in: Linear, linear_out: Linear, - activation: ReLU, + activation: Relu, } ``` @@ -59,7 +59,7 @@ impl Model { Model { linear_in: LinearConfig::new(10, 64).init_with(record.linear_in), linear_out: LinearConfig::new(64, 2).init_with(record.linear_out), - activation: ReLU::new(), + activation: Relu::new(), } } @@ -70,7 +70,7 @@ impl Model { Model { linear_in: l1, linear_out: l2, - activation: ReLU::new(), + activation: Relu::new(), } } } diff --git a/burn-core/src/nn/loss/mse.rs b/burn-core/src/nn/loss/mse.rs index e99e69c376..00945d004b 100644 --- a/burn-core/src/nn/loss/mse.rs +++ b/burn-core/src/nn/loss/mse.rs @@ -5,17 +5,17 @@ use burn_tensor::{backend::Backend, Tensor}; /// Calculate the mean squared error loss from the input logits and the targets. #[derive(Clone, Debug)] -pub struct MSELoss { +pub struct MseLoss { backend: PhantomData, } -impl Default for MSELoss { +impl Default for MseLoss { fn default() -> Self { Self::new() } } -impl MSELoss { +impl MseLoss { /// Create the criterion. pub fn new() -> Self { Self { @@ -67,7 +67,7 @@ mod tests { let targets = Tensor::::from_data(Data::from([[2.0, 1.0], [3.0, 2.0]]), &device); - let mse = MSELoss::new(); + let mse = MseLoss::new(); let loss_no_reduction = mse.forward_no_reduction(logits.clone(), targets.clone()); let loss = mse.forward(logits.clone(), targets.clone(), Reduction::Auto); let loss_sum = mse.forward(logits, targets, Reduction::Sum); diff --git a/burn-core/src/nn/relu.rs b/burn-core/src/nn/relu.rs index 92e260c7ee..bd8c92a4dd 100644 --- a/burn-core/src/nn/relu.rs +++ b/burn-core/src/nn/relu.rs @@ -8,9 +8,9 @@ use crate::tensor::Tensor; /// /// `y = max(0, x)` #[derive(Module, Clone, Debug, Default)] -pub struct ReLU {} +pub struct Relu {} -impl ReLU { +impl Relu { /// Create the module. pub fn new() -> Self { Self {} diff --git a/burn-core/src/optim/adagrad.rs b/burn-core/src/optim/adagrad.rs index ab528c211d..20edc3291a 100644 --- a/burn-core/src/optim/adagrad.rs +++ b/burn-core/src/optim/adagrad.rs @@ -27,14 +27,14 @@ pub struct AdaGradConfig { /// AdaGrad optimizer pub struct AdaGrad { - lr_decay: LRDecay, + lr_decay: LrDecay, weight_decay: Option>, } /// AdaGrad state. #[derive(Record, Clone, new)] pub struct AdaGradState { - lr_decay: LRDecayState, + lr_decay: LrDecayState, } impl SimpleOptimizer for AdaGrad { @@ -81,7 +81,7 @@ impl AdaGradConfig { /// Returns an optimizer that can be used to optimize a module. pub fn init>(&self) -> impl Optimizer { let optim = AdaGrad { - lr_decay: LRDecay { + lr_decay: LrDecay { lr_decay: self.lr_decay, epsilon: self.epsilon, }, @@ -98,29 +98,29 @@ impl AdaGradConfig { /// Learning rate decay state (also includes sum state). #[derive(Record, new, Clone)] -pub struct LRDecayState { +pub struct LrDecayState { time: usize, sum: Tensor, } -struct LRDecay { +struct LrDecay { lr_decay: f64, epsilon: f32, } -impl LRDecay { +impl LrDecay { pub fn transform( &self, grad: Tensor, lr: LearningRate, - lr_decay_state: Option>, - ) -> (Tensor, LRDecayState) { + lr_decay_state: Option>, + ) -> (Tensor, LrDecayState) { let state = if let Some(mut state) = lr_decay_state { state.sum = state.sum.add(grad.clone().powf_scalar(2.)); state.time += 1; state } else { - LRDecayState::new(1, grad.clone().powf_scalar(2.)) + LrDecayState::new(1, grad.clone().powf_scalar(2.)) }; let new_lr = lr / (1. + (state.time as f64 - 1.) * self.lr_decay); @@ -133,7 +133,7 @@ impl LRDecay { } } -impl LRDecayState { +impl LrDecayState { /// Move state to device. /// /// # Arguments @@ -278,7 +278,7 @@ mod tests { { let config = AdaGradConfig::new(); AdaGrad { - lr_decay: LRDecay { + lr_decay: LrDecay { lr_decay: config.lr_decay, epsilon: config.epsilon, }, diff --git a/burn-core/src/optim/rmsprop.rs b/burn-core/src/optim/rmsprop.rs index 11b36ea94c..fd6d2e6837 100644 --- a/burn-core/src/optim/rmsprop.rs +++ b/burn-core/src/optim/rmsprop.rs @@ -12,19 +12,19 @@ use crate::optim::adaptor::OptimizerAdaptor; use crate::tensor::{backend::AutodiffBackend, Tensor}; use burn_tensor::backend::Backend; -/// Configuration to create the [RMSProp](RMSProp) optimizer. +/// Configuration to create the [RmsProp](RmsProp) optimizer. #[derive(Config)] -pub struct RMSPropConfig { +pub struct RmsPropConfig { /// Smoothing constant. #[config(default = 0.99)] alpha: f32, - /// momentum for RMSProp. + /// momentum for RmsProp. #[config(default = 0.9)] momentum: f32, /// A value required for numerical stability. #[config(default = 1e-5)] epsilon: f32, - /// if True, compute the centered RMSProp, the gradient is normalized by an estimation of its variance + /// if True, compute the centered RmsProp, the gradient is normalized by an estimation of its variance #[config(default = false)] centered: bool, /// [Weight decay](WeightDecayConfig) config. @@ -33,22 +33,22 @@ pub struct RMSPropConfig { grad_clipping: Option, } -impl RMSPropConfig { - /// Initialize RMSProp optimizer. +impl RmsPropConfig { + /// Initialize RmsProp optimizer. /// /// # Returns /// /// Returns an optimizer that can be used to optimize a module. pub fn init>( &self, - ) -> OptimizerAdaptor, M, B> { + ) -> OptimizerAdaptor, M, B> { let weight_decay = self.weight_decay.as_ref().map(WeightDecay::new); - let mut optim = OptimizerAdaptor::from(RMSProp { + let mut optim = OptimizerAdaptor::from(RmsProp { alpha: self.alpha, centered: self.centered, weight_decay, - momentum: RMSPropMomentum { + momentum: RmsPropMomentum { momentum: self.momentum, epsilon: self.epsilon, }, @@ -63,18 +63,18 @@ impl RMSPropConfig { } /// Optimizer that implements stochastic gradient descent with momentum. -/// The optimizer can be configured with [RMSPropConfig](RMSPropConfig). -pub struct RMSProp { +/// The optimizer can be configured with [RmsPropConfig](RmsPropConfig). +pub struct RmsProp { alpha: f32, // epsilon: f32, centered: bool, // momentum: Option>, - momentum: RMSPropMomentum, + momentum: RmsPropMomentum, weight_decay: Option>, } -impl SimpleOptimizer for RMSProp { - type State = RMSPropState; +impl SimpleOptimizer for RmsProp { + type State = RmsPropState; fn step( &self, @@ -117,7 +117,7 @@ impl SimpleOptimizer for RMSProp { .transform(grad, state_centered, state_momentum); // transition state - let state = RMSPropState::new(state_square_avg, state_centered, state_momentum); + let state = RmsPropState::new(state_square_avg, state_centered, state_momentum); // tensor param transform let delta = grad.mul_scalar(lr); @@ -135,12 +135,12 @@ impl SimpleOptimizer for RMSProp { } } -/// State of [RMSProp](RMSProp) +/// State of [RmsProp](RmsProp) #[derive(Record, Clone, new)] -pub struct RMSPropState { +pub struct RmsPropState { square_avg: SquareAvgState, centered: CenteredState, - momentum: Option>, + momentum: Option>, } /// [SquareAvgState](SquareAvgState) is to store and pass optimizer step params. @@ -249,24 +249,24 @@ impl CenteredState { } } -/// [RMSPropMomentum](RMSPropMomentum) is to store config status for optimizer. -/// (, which is stored in [optimizer](RMSProp) itself and not passed in during `step()` calculation) -pub struct RMSPropMomentum { +/// [RmsPropMomentum](RmsPropMomentum) is to store config status for optimizer. +/// (, which is stored in [optimizer](RmsProp) itself and not passed in during `step()` calculation) +pub struct RmsPropMomentum { momentum: f32, epsilon: f32, } -impl RMSPropMomentum { - /// transform [grad](Tensor) and [RMSPropMomentumState] to the next step +impl RmsPropMomentum { + /// transform [grad](Tensor) and [RmsPropMomentumState] to the next step fn transform( &self, grad: Tensor, centered_state: CenteredState, - momentum_state: Option>, + momentum_state: Option>, ) -> ( Tensor, CenteredState, - Option>, + Option>, ) { let grad = grad.div(centered_state.avg.clone().sqrt().add_scalar(self.epsilon)); @@ -278,7 +278,7 @@ impl RMSPropMomentum { ( buf.clone(), centered_state, - Some(RMSPropMomentumState { buf }), + Some(RmsPropMomentumState { buf }), ) } else { (grad, centered_state, None) @@ -286,13 +286,13 @@ impl RMSPropMomentum { } } -/// [RMSPropMomentumState](RMSPropMomentumState) is to store and pass optimizer step params. +/// [RmsPropMomentumState](RmsPropMomentumState) is to store and pass optimizer step params. #[derive(Record, Clone, new)] -pub struct RMSPropMomentumState { +pub struct RmsPropMomentumState { buf: Tensor, } -impl RMSPropMomentumState { +impl RmsPropMomentumState { /// Moves the state to a device. /// /// # Arguments @@ -378,7 +378,7 @@ mod tests { ) .require_grad(); - let mut optimizer = RMSPropConfig::new() + let mut optimizer = RmsPropConfig::new() .with_alpha(0.99) .with_epsilon(1e-8) .with_weight_decay(WeightDecayConfig::new(0.05).into()) @@ -453,7 +453,7 @@ mod tests { ) .require_grad(); - let mut optimizer = RMSPropConfig::new() + let mut optimizer = RmsPropConfig::new() .with_alpha(0.99) .with_epsilon(1e-8) .with_weight_decay(WeightDecayConfig::new(0.05).into()) @@ -529,9 +529,9 @@ mod tests { } fn create_rmsprop( - ) -> OptimizerAdaptor, nn::Linear, TestAutodiffBackend> + ) -> OptimizerAdaptor, nn::Linear, TestAutodiffBackend> { - RMSPropConfig { + RmsPropConfig { alpha: 0.99, epsilon: 1e-9, centered: false, diff --git a/burn-dataset/src/source/huggingface/downloader.rs b/burn-dataset/src/source/huggingface/downloader.rs index 9d3ef277dc..9e0c152bdc 100644 --- a/burn-dataset/src/source/huggingface/downloader.rs +++ b/burn-dataset/src/source/huggingface/downloader.rs @@ -49,12 +49,12 @@ pub enum ImporterError { /// use serde::{Deserialize, Serialize}; /// /// #[derive(Deserialize, Debug, Clone)] -/// struct MNISTItemRaw { +/// struct MnistItemRaw { /// pub image_bytes: Vec, /// pub label: usize, /// } /// -/// let train_ds:SqliteDataset = HuggingfaceDatasetLoader::new("mnist") +/// let train_ds:SqliteDataset = HuggingfaceDatasetLoader::new("mnist") /// .dataset("train") /// .unwrap(); pub struct HuggingfaceDatasetLoader { diff --git a/burn-dataset/src/vision/mnist.rs b/burn-dataset/src/vision/mnist.rs index 040442277c..20173f65c5 100644 --- a/burn-dataset/src/vision/mnist.rs +++ b/burn-dataset/src/vision/mnist.rs @@ -24,7 +24,7 @@ const HEIGHT: usize = 28; /// MNIST item. #[derive(Deserialize, Serialize, Debug, Clone)] -pub struct MNISTItem { +pub struct MnistItem { /// Image as a 2D array of floats. pub image: [[f32; WIDTH]; HEIGHT], @@ -33,16 +33,16 @@ pub struct MNISTItem { } #[derive(Deserialize, Debug, Clone)] -struct MNISTItemRaw { +struct MnistItemRaw { pub image_bytes: Vec, pub label: u8, } struct BytesToImage; -impl Mapper for BytesToImage { +impl Mapper for BytesToImage { /// Convert a raw MNIST item (image bytes) to a MNIST item (2D array image). - fn map(&self, item: &MNISTItemRaw) -> MNISTItem { + fn map(&self, item: &MnistItemRaw) -> MnistItem { // Ensure the image dimensions are correct. debug_assert_eq!(item.image_bytes.len(), WIDTH * HEIGHT); @@ -54,25 +54,25 @@ impl Mapper for BytesToImage { image_array[y][x] = *pixel as f32; } - MNISTItem { + MnistItem { image: image_array, label: item.label, } } } -type MappedDataset = MapperDataset, BytesToImage, MNISTItemRaw>; +type MappedDataset = MapperDataset, BytesToImage, MnistItemRaw>; /// The MNIST dataset consists of 70,000 28x28 black-and-white images in 10 classes (one for each digits), with 7,000 /// images per class. There are 60,000 training images and 10,000 test images. /// /// The data is downloaded from the web from the [CVDF mirror](https://github.com/cvdfoundation/mnist). -pub struct MNISTDataset { +pub struct MnistDataset { dataset: MappedDataset, } -impl Dataset for MNISTDataset { - fn get(&self, index: usize) -> Option { +impl Dataset for MnistDataset { + fn get(&self, index: usize) -> Option { self.dataset.get(index) } @@ -81,7 +81,7 @@ impl Dataset for MNISTDataset { } } -impl MNISTDataset { +impl MnistDataset { /// Creates a new train dataset. pub fn train() -> Self { Self::new("train") @@ -94,19 +94,19 @@ impl MNISTDataset { fn new(split: &str) -> Self { // Download dataset - let root = MNISTDataset::download(split); + let root = MnistDataset::download(split); // MNIST is tiny so we can load it in-memory // Train images (u8): 28 * 28 * 60000 = 47.04Mb // Test images (u8): 28 * 28 * 10000 = 7.84Mb - let images = MNISTDataset::read_images(&root, split); - let labels = MNISTDataset::read_labels(&root, split); + let images = MnistDataset::read_images(&root, split); + let labels = MnistDataset::read_labels(&root, split); - // Collect as vector of MNISTItemRaw + // Collect as vector of MnistItemRaw let items: Vec<_> = images .into_iter() .zip(labels) - .map(|(image_bytes, label)| MNISTItemRaw { image_bytes, label }) + .map(|(image_bytes, label)| MnistItemRaw { image_bytes, label }) .collect(); let dataset = InMemDataset::new(items); @@ -132,12 +132,12 @@ impl MNISTDataset { // Download split files match split { "train" => { - MNISTDataset::download_file(TRAIN_IMAGES, &split_dir); - MNISTDataset::download_file(TRAIN_LABELS, &split_dir); + MnistDataset::download_file(TRAIN_IMAGES, &split_dir); + MnistDataset::download_file(TRAIN_LABELS, &split_dir); } "test" => { - MNISTDataset::download_file(TEST_IMAGES, &split_dir); - MNISTDataset::download_file(TEST_LABELS, &split_dir); + MnistDataset::download_file(TEST_IMAGES, &split_dir); + MnistDataset::download_file(TEST_LABELS, &split_dir); } _ => panic!("Invalid split specified {}", split), }; diff --git a/burn-import/pytorch-tests/tests/linear/mod.rs b/burn-import/pytorch-tests/tests/linear/mod.rs index 2864d7b0e0..7dfa05e827 100644 --- a/burn-import/pytorch-tests/tests/linear/mod.rs +++ b/burn-import/pytorch-tests/tests/linear/mod.rs @@ -1,6 +1,6 @@ use burn::{ module::Module, - nn::{Linear, LinearConfig, ReLU}, + nn::{Linear, LinearConfig, Relu}, tensor::{backend::Backend, Tensor}, }; @@ -8,7 +8,7 @@ use burn::{ pub struct Net { fc1: Linear, fc2: Linear, - relu: ReLU, + relu: Relu, } impl Net { @@ -16,7 +16,7 @@ impl Net { pub fn new_with(record: NetRecord) -> Self { let fc1 = LinearConfig::new(2, 3).init_with(record.fc1); let fc2 = LinearConfig::new(3, 4).init_with(record.fc2); - let relu = ReLU::default(); + let relu = Relu::default(); Self { fc1, fc2, relu } } diff --git a/burn-import/src/onnx/from_onnx.rs b/burn-import/src/onnx/from_onnx.rs index 940aba72ad..9c3e9564a2 100644 --- a/burn-import/src/onnx/from_onnx.rs +++ b/burn-import/src/onnx/from_onnx.rs @@ -9,7 +9,7 @@ use crate::onnx::{ proto_conversion::convert_node_proto, }; -use super::ir::{ArgType, Argument, Node, NodeType, ONNXGraph, Tensor}; +use super::ir::{ArgType, Argument, Node, NodeType, OnnxGraph, Tensor}; use super::protos::{ModelProto, TensorProto}; use super::{dim_inference::dim_inference, protos::ValueInfoProto}; @@ -33,14 +33,14 @@ const LIFT_CONSTANTS_FOR_NODE_TYPES: [NodeType; 7] = [ /// /// # Returns /// -/// * `ONNXGraph` - The graph representation of the onnx file +/// * `OnnxGraph` - The graph representation of the onnx file /// /// # Panics /// /// * If the file cannot be opened /// * If the file cannot be parsed /// * If the nodes are not topologically sorted -pub fn parse_onnx(onnx_path: &Path) -> ONNXGraph { +pub fn parse_onnx(onnx_path: &Path) -> OnnxGraph { log::info!("Parsing ONNX file: {}", onnx_path.display()); // Open the file @@ -118,7 +118,7 @@ pub fn parse_onnx(onnx_path: &Path) -> ONNXGraph { log::info!("Finished parsing ONNX file: {}", onnx_path.display()); - ONNXGraph { + OnnxGraph { nodes, inputs, outputs, diff --git a/burn-import/src/onnx/ir.rs b/burn-import/src/onnx/ir.rs index 65f03bc102..be27a70dd7 100644 --- a/burn-import/src/onnx/ir.rs +++ b/burn-import/src/onnx/ir.rs @@ -129,7 +129,7 @@ pub enum Data { /// ONNX graph representation #[derive(Debug, Clone)] -pub struct ONNXGraph { +pub struct OnnxGraph { /// The nodes of the graph. pub nodes: Vec, diff --git a/burn-import/src/onnx/mod.rs b/burn-import/src/onnx/mod.rs index b1f1da971b..b0d14549fb 100644 --- a/burn-import/src/onnx/mod.rs +++ b/burn-import/src/onnx/mod.rs @@ -11,4 +11,4 @@ mod to_burn; pub use to_burn::*; pub use from_onnx::parse_onnx; -pub use ir::ONNXGraph; +pub use ir::OnnxGraph; diff --git a/burn-import/src/onnx/to_burn.rs b/burn-import/src/onnx/to_burn.rs index b0fbfb556f..bd17bf1cd3 100644 --- a/burn-import/src/onnx/to_burn.rs +++ b/burn-import/src/onnx/to_burn.rs @@ -45,7 +45,7 @@ use crate::{ use super::{ from_onnx::parse_onnx, - ir::{self, ArgType, Argument, Data, ElementType, ONNXGraph}, + ir::{self, ArgType, Argument, Data, ElementType, OnnxGraph}, op_configuration::{ avg_pool2d_config, clip_config, concat_config, dropout_config, reshape_config, softmax_config, @@ -218,7 +218,7 @@ impl ModelGen { } } -impl ONNXGraph { +impl OnnxGraph { /// Converts ONNX graph to Burn graph. pub fn into_burn(self) -> BurnGraph { let mut graph = BurnGraph::::default(); diff --git a/burn-no-std-tests/src/mlp.rs b/burn-no-std-tests/src/mlp.rs index 619f676761..db13e06146 100644 --- a/burn-no-std-tests/src/mlp.rs +++ b/burn-no-std-tests/src/mlp.rs @@ -28,7 +28,7 @@ pub struct MlpConfig { pub struct Mlp { linears: Vec>, dropout: nn::Dropout, - activation: nn::ReLU, + activation: nn::Relu, } impl Mlp { @@ -43,7 +43,7 @@ impl Mlp { Self { linears, dropout: nn::DropoutConfig::new(0.3).init(), - activation: nn::ReLU::new(), + activation: nn::Relu::new(), } } diff --git a/burn-train/src/metric/cuda.rs b/burn-train/src/metric/cuda.rs index e69e11ffc1..37d131fdf4 100644 --- a/burn-train/src/metric/cuda.rs +++ b/burn-train/src/metric/cuda.rs @@ -3,11 +3,11 @@ use crate::metric::{Metric, MetricEntry}; use nvml_wrapper::Nvml; /// Track basic cuda infos. -pub struct CUDAMetric { +pub struct CudaMetric { nvml: Option, } -impl CUDAMetric { +impl CudaMetric { /// Creates a new metric for CUDA. pub fn new() -> Self { Self { @@ -19,7 +19,7 @@ impl CUDAMetric { } } -impl Default for CUDAMetric { +impl Default for CudaMetric { fn default() -> Self { Self::new() } @@ -29,7 +29,7 @@ impl Adaptor<()> for T { fn adapt(&self) {} } -impl Metric for CUDAMetric { +impl Metric for CudaMetric { const NAME: &'static str = "CUDA Stats"; type Input = (); diff --git a/burn/src/lib.rs b/burn/src/lib.rs index 64cad0331f..b59716e76c 100644 --- a/burn/src/lib.rs +++ b/burn/src/lib.rs @@ -61,7 +61,7 @@ //! - `audio`: Enables audio datasets (SpeechCommandsDataset) //! - `sqlite`: Stores datasets in SQLite database //! - `sqlite_bundled`: Use bundled version of SQLite -//! - `vision`: Enables vision datasets (MNISTDataset) +//! - `vision`: Enables vision datasets (MnistDataset) //! - Backends //! - `wgpu`: Makes available the WGPU backend //! - `candle`: Makes available the Candle backend diff --git a/examples/custom-image-dataset/src/model.rs b/examples/custom-image-dataset/src/model.rs index 8de1e76084..7abc450db0 100644 --- a/examples/custom-image-dataset/src/model.rs +++ b/examples/custom-image-dataset/src/model.rs @@ -3,7 +3,7 @@ use burn::{ nn::{ conv::{Conv2d, Conv2dConfig}, pool::{MaxPool2d, MaxPool2dConfig}, - Dropout, DropoutConfig, Linear, LinearConfig, PaddingConfig2d, ReLU, + Dropout, DropoutConfig, Linear, LinearConfig, PaddingConfig2d, Relu, }, tensor::{backend::Backend, Device, Tensor}, }; @@ -23,8 +23,8 @@ use burn::{ // │ maxpool │ // └────────────────────┘ #[derive(Module, Debug)] -pub struct CNN { - activation: ReLU, +pub struct Cnn { + activation: Relu, dropout: Dropout, pool: MaxPool2d, conv1: Conv2d, @@ -37,7 +37,7 @@ pub struct CNN { fc2: Linear, } -impl CNN { +impl Cnn { pub fn new(num_classes: usize, device: &Device) -> Self { let conv1 = Conv2dConfig::new([3, 32], [3, 3]) .with_padding(PaddingConfig2d::Same) @@ -68,7 +68,7 @@ impl CNN { let dropout = DropoutConfig::new(0.3).init(); Self { - activation: ReLU::new(), + activation: Relu::new(), dropout, pool, conv1, diff --git a/examples/custom-image-dataset/src/training.rs b/examples/custom-image-dataset/src/training.rs index 5f012377fc..11bfdf522e 100644 --- a/examples/custom-image-dataset/src/training.rs +++ b/examples/custom-image-dataset/src/training.rs @@ -3,7 +3,7 @@ use std::time::Instant; use crate::{ data::{ClassificationBatch, ClassificationBatcher}, dataset::CIFAR10Loader, - model::CNN, + model::Cnn, }; use burn::data::{dataloader::DataLoaderBuilder, dataset::vision::ImageFolderDataset}; use burn::train::{ @@ -26,7 +26,7 @@ use burn::{ const NUM_CLASSES: u8 = 10; const ARTIFACT_DIR: &str = "/tmp/custom-image-dataset"; -impl CNN { +impl Cnn { pub fn forward_classification( &self, images: Tensor, @@ -41,7 +41,7 @@ impl CNN { } } -impl TrainStep, ClassificationOutput> for CNN { +impl TrainStep, ClassificationOutput> for Cnn { fn step(&self, batch: ClassificationBatch) -> TrainOutput> { let item = self.forward_classification(batch.images, batch.targets); @@ -49,7 +49,7 @@ impl TrainStep, ClassificationOutput< } } -impl ValidStep, ClassificationOutput> for CNN { +impl ValidStep, ClassificationOutput> for Cnn { fn step(&self, batch: ClassificationBatch) -> ClassificationOutput { self.forward_classification(batch.images, batch.targets) } @@ -104,7 +104,7 @@ pub fn train(config: TrainingConfig, device: B::Device) { .devices(vec![device.clone()]) .num_epochs(config.num_epochs) .build( - CNN::new(NUM_CLASSES.into(), &device), + Cnn::new(NUM_CLASSES.into(), &device), config.optimizer.init(), config.learning_rate, ); diff --git a/examples/custom-renderer/src/lib.rs b/examples/custom-renderer/src/lib.rs index 30078c8116..c6d84750b7 100644 --- a/examples/custom-renderer/src/lib.rs +++ b/examples/custom-renderer/src/lib.rs @@ -1,11 +1,11 @@ -use burn::data::dataset::vision::MNISTDataset; +use burn::data::dataset::vision::MnistDataset; use burn::train::renderer::{MetricState, MetricsRenderer, TrainingProgress}; use burn::train::LearnerBuilder; use burn::{ config::Config, data::dataloader::DataLoaderBuilder, optim::AdamConfig, tensor::backend::AutodiffBackend, }; -use guide::{data::MNISTBatcher, model::ModelConfig}; +use guide::{data::MnistBatcher, model::ModelConfig}; #[derive(Config)] pub struct MnistTrainingConfig { @@ -52,21 +52,21 @@ pub fn run(device: B::Device) { let optim = config.optimizer.init(); // Create the batcher. - let batcher_train = MNISTBatcher::::new(device.clone()); - let batcher_valid = MNISTBatcher::::new(device.clone()); + let batcher_train = MnistBatcher::::new(device.clone()); + let batcher_valid = MnistBatcher::::new(device.clone()); // Create the dataloaders. let dataloader_train = DataLoaderBuilder::new(batcher_train) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::train()); + .build(MnistDataset::train()); let dataloader_test = DataLoaderBuilder::new(batcher_valid) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::test()); + .build(MnistDataset::test()); // artifact dir does not need to be provided when log_to_file is false let builder = LearnerBuilder::new("") diff --git a/examples/custom-training-loop/src/lib.rs b/examples/custom-training-loop/src/lib.rs index cfb702015a..ea91839207 100644 --- a/examples/custom-training-loop/src/lib.rs +++ b/examples/custom-training-loop/src/lib.rs @@ -1,6 +1,6 @@ use std::marker::PhantomData; -use burn::data::dataset::vision::MNISTDataset; +use burn::data::dataset::vision::MnistDataset; use burn::{ config::Config, data::dataloader::DataLoaderBuilder, @@ -13,7 +13,7 @@ use burn::{ }, }; use guide::{ - data::{MNISTBatch, MNISTBatcher}, + data::{MnistBatch, MnistBatcher}, model::{Model, ModelConfig}, }; @@ -46,21 +46,21 @@ pub fn run(device: B::Device) { let mut optim = config.optimizer.init(); // Create the batcher. - let batcher_train = MNISTBatcher::::new(device.clone()); - let batcher_valid = MNISTBatcher::::new(device.clone()); + let batcher_train = MnistBatcher::::new(device.clone()); + let batcher_valid = MnistBatcher::::new(device.clone()); // Create the dataloaders. let dataloader_train = DataLoaderBuilder::new(batcher_train) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::train()); + .build(MnistDataset::train()); let dataloader_test = DataLoaderBuilder::new(batcher_valid) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::test()); + .build(MnistDataset::test()); // Iterate over our training and validation loop for X epochs. for epoch in 1..config.num_epochs + 1 { @@ -145,7 +145,7 @@ where B: AutodiffBackend, O: Optimizer, B>, { - pub fn step1(&mut self, _batch: MNISTBatch) { + pub fn step1(&mut self, _batch: MnistBatch) { // } } @@ -156,14 +156,14 @@ where B: AutodiffBackend, O: Optimizer, B>, { - pub fn step2(&mut self, _batch: MNISTBatch) { + pub fn step2(&mut self, _batch: MnistBatch) { // } } #[allow(dead_code)] impl Learner2 { - pub fn step3(&mut self, _batch: MNISTBatch) + pub fn step3(&mut self, _batch: MnistBatch) where B: AutodiffBackend, M: AutodiffModule, diff --git a/examples/guide/examples/guide.rs b/examples/guide/examples/guide.rs index 9ae3ee843b..99bf330282 100644 --- a/examples/guide/examples/guide.rs +++ b/examples/guide/examples/guide.rs @@ -18,7 +18,7 @@ fn main() { guide::inference::infer::( artifact_dir, device, - burn::data::dataset::vision::MNISTDataset::test() + burn::data::dataset::vision::MnistDataset::test() .get(42) .unwrap(), ); diff --git a/examples/guide/src/data.rs b/examples/guide/src/data.rs index 2d80159614..f14bad72e6 100644 --- a/examples/guide/src/data.rs +++ b/examples/guide/src/data.rs @@ -1,26 +1,26 @@ use burn::{ - data::{dataloader::batcher::Batcher, dataset::vision::MNISTItem}, + data::{dataloader::batcher::Batcher, dataset::vision::MnistItem}, tensor::{backend::Backend, Data, ElementConversion, Int, Tensor}, }; -pub struct MNISTBatcher { +pub struct MnistBatcher { device: B::Device, } -impl MNISTBatcher { +impl MnistBatcher { pub fn new(device: B::Device) -> Self { Self { device } } } #[derive(Clone, Debug)] -pub struct MNISTBatch { +pub struct MnistBatch { pub images: Tensor, pub targets: Tensor, } -impl Batcher> for MNISTBatcher { - fn batch(&self, items: Vec) -> MNISTBatch { +impl Batcher> for MnistBatcher { + fn batch(&self, items: Vec) -> MnistBatch { let images = items .iter() .map(|item| Data::::from(item.image)) @@ -40,6 +40,6 @@ impl Batcher> for MNISTBatcher { let images = Tensor::cat(images, 0); let targets = Tensor::cat(targets, 0); - MNISTBatch { images, targets } + MnistBatch { images, targets } } } diff --git a/examples/guide/src/inference.rs b/examples/guide/src/inference.rs index 80db2d864b..e93ecd767d 100644 --- a/examples/guide/src/inference.rs +++ b/examples/guide/src/inference.rs @@ -1,5 +1,5 @@ -use crate::{data::MNISTBatcher, training::TrainingConfig}; -use burn::data::dataset::vision::MNISTItem; +use crate::{data::MnistBatcher, training::TrainingConfig}; +use burn::data::dataset::vision::MnistItem; use burn::{ config::Config, data::dataloader::batcher::Batcher, @@ -7,7 +7,7 @@ use burn::{ tensor::backend::Backend, }; -pub fn infer(artifact_dir: &str, device: B::Device, item: MNISTItem) { +pub fn infer(artifact_dir: &str, device: B::Device, item: MnistItem) { let config = TrainingConfig::load(format!("{artifact_dir}/config.json")) .expect("Config should exist for the model"); let record = CompactRecorder::new() @@ -17,7 +17,7 @@ pub fn infer(artifact_dir: &str, device: B::Device, item: MNISTItem) let model = config.model.init_with::(record); let label = item.label; - let batcher = MNISTBatcher::new(device); + let batcher = MnistBatcher::new(device); let batch = batcher.batch(vec![item]); let output = model.forward(batch.images); let predicted = output.argmax(1).flatten::<1>(0, 1).into_scalar(); diff --git a/examples/guide/src/model.rs b/examples/guide/src/model.rs index 9db5ebd001..d0405757d8 100644 --- a/examples/guide/src/model.rs +++ b/examples/guide/src/model.rs @@ -4,7 +4,7 @@ use burn::{ nn::{ conv::{Conv2d, Conv2dConfig}, pool::{AdaptiveAvgPool2d, AdaptiveAvgPool2dConfig}, - Dropout, DropoutConfig, Linear, LinearConfig, ReLU, + Dropout, DropoutConfig, Linear, LinearConfig, Relu, }, tensor::{backend::Backend, Tensor}, }; @@ -17,7 +17,7 @@ pub struct Model { dropout: Dropout, linear1: Linear, linear2: Linear, - activation: ReLU, + activation: Relu, } #[derive(Config, Debug)] @@ -35,7 +35,7 @@ impl ModelConfig { conv1: Conv2dConfig::new([1, 8], [3, 3]).init(device), conv2: Conv2dConfig::new([8, 16], [3, 3]).init(device), pool: AdaptiveAvgPool2dConfig::new([8, 8]).init(), - activation: ReLU::new(), + activation: Relu::new(), linear1: LinearConfig::new(16 * 8 * 8, self.hidden_size).init(device), linear2: LinearConfig::new(self.hidden_size, self.num_classes).init(device), dropout: DropoutConfig::new(self.dropout).init(), @@ -47,7 +47,7 @@ impl ModelConfig { conv1: Conv2dConfig::new([1, 8], [3, 3]).init_with(record.conv1), conv2: Conv2dConfig::new([8, 16], [3, 3]).init_with(record.conv2), pool: AdaptiveAvgPool2dConfig::new([8, 8]).init(), - activation: ReLU::new(), + activation: Relu::new(), linear1: LinearConfig::new(16 * 8 * 8, self.hidden_size).init_with(record.linear1), linear2: LinearConfig::new(self.hidden_size, self.num_classes) .init_with(record.linear2), diff --git a/examples/guide/src/training.rs b/examples/guide/src/training.rs index a0f0accb0f..4ebd7e6e4b 100644 --- a/examples/guide/src/training.rs +++ b/examples/guide/src/training.rs @@ -1,8 +1,8 @@ use crate::{ - data::{MNISTBatch, MNISTBatcher}, + data::{MnistBatch, MnistBatcher}, model::{Model, ModelConfig}, }; -use burn::data::dataset::vision::MNISTDataset; +use burn::data::dataset::vision::MnistDataset; use burn::train::{ metric::{AccuracyMetric, LossMetric}, ClassificationOutput, LearnerBuilder, TrainOutput, TrainStep, ValidStep, @@ -36,16 +36,16 @@ impl Model { } } -impl TrainStep, ClassificationOutput> for Model { - fn step(&self, batch: MNISTBatch) -> TrainOutput> { +impl TrainStep, ClassificationOutput> for Model { + fn step(&self, batch: MnistBatch) -> TrainOutput> { let item = self.forward_classification(batch.images, batch.targets); TrainOutput::new(self, item.loss.backward(), item) } } -impl ValidStep, ClassificationOutput> for Model { - fn step(&self, batch: MNISTBatch) -> ClassificationOutput { +impl ValidStep, ClassificationOutput> for Model { + fn step(&self, batch: MnistBatch) -> ClassificationOutput { self.forward_classification(batch.images, batch.targets) } } @@ -74,20 +74,20 @@ pub fn train(artifact_dir: &str, config: TrainingConfig, dev B::seed(config.seed); - let batcher_train = MNISTBatcher::::new(device.clone()); - let batcher_valid = MNISTBatcher::::new(device.clone()); + let batcher_train = MnistBatcher::::new(device.clone()); + let batcher_valid = MnistBatcher::::new(device.clone()); let dataloader_train = DataLoaderBuilder::new(batcher_train) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::train()); + .build(MnistDataset::train()); let dataloader_test = DataLoaderBuilder::new(batcher_valid) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::test()); + .build(MnistDataset::test()); let learner = LearnerBuilder::new(artifact_dir) .metric_train_numeric(AccuracyMetric::new()) diff --git a/examples/mnist/src/data.rs b/examples/mnist/src/data.rs index 68fbbc2d63..03d8682974 100644 --- a/examples/mnist/src/data.rs +++ b/examples/mnist/src/data.rs @@ -1,26 +1,26 @@ use burn::{ - data::{dataloader::batcher::Batcher, dataset::vision::MNISTItem}, + data::{dataloader::batcher::Batcher, dataset::vision::MnistItem}, tensor::{backend::Backend, Data, ElementConversion, Int, Tensor}, }; -pub struct MNISTBatcher { +pub struct MnistBatcher { device: B::Device, } #[derive(Clone, Debug)] -pub struct MNISTBatch { +pub struct MnistBatch { pub images: Tensor, pub targets: Tensor, } -impl MNISTBatcher { +impl MnistBatcher { pub fn new(device: B::Device) -> Self { Self { device } } } -impl Batcher> for MNISTBatcher { - fn batch(&self, items: Vec) -> MNISTBatch { +impl Batcher> for MnistBatcher { + fn batch(&self, items: Vec) -> MnistBatch { let images = items .iter() .map(|item| Data::::from(item.image)) @@ -45,6 +45,6 @@ impl Batcher> for MNISTBatcher { let images = Tensor::cat(images, 0); let targets = Tensor::cat(targets, 0); - MNISTBatch { images, targets } + MnistBatch { images, targets } } } diff --git a/examples/mnist/src/model.rs b/examples/mnist/src/model.rs index ff254d4bc1..e6090fd843 100644 --- a/examples/mnist/src/model.rs +++ b/examples/mnist/src/model.rs @@ -1,4 +1,4 @@ -use crate::data::MNISTBatch; +use crate::data::MnistBatch; use burn::{ module::Module, nn::{self, loss::CrossEntropyLossConfig, BatchNorm, PaddingConfig2d}, @@ -73,7 +73,7 @@ impl Model { self.fc2.forward(x) } - pub fn forward_classification(&self, item: MNISTBatch) -> ClassificationOutput { + pub fn forward_classification(&self, item: MnistBatch) -> ClassificationOutput { let targets = item.targets; let output = self.forward(item.images); let loss = CrossEntropyLossConfig::new() @@ -117,16 +117,16 @@ impl ConvBlock { } } -impl TrainStep, ClassificationOutput> for Model { - fn step(&self, item: MNISTBatch) -> TrainOutput> { +impl TrainStep, ClassificationOutput> for Model { + fn step(&self, item: MnistBatch) -> TrainOutput> { let item = self.forward_classification(item); TrainOutput::new(self, item.loss.backward(), item) } } -impl ValidStep, ClassificationOutput> for Model { - fn step(&self, item: MNISTBatch) -> ClassificationOutput { +impl ValidStep, ClassificationOutput> for Model { + fn step(&self, item: MnistBatch) -> ClassificationOutput { self.forward_classification(item) } } diff --git a/examples/mnist/src/training.rs b/examples/mnist/src/training.rs index c1c1c68efa..ace04d4f88 100644 --- a/examples/mnist/src/training.rs +++ b/examples/mnist/src/training.rs @@ -1,4 +1,4 @@ -use crate::data::MNISTBatcher; +use crate::data::MnistBatcher; use crate::model::Model; use burn::module::Module; @@ -10,7 +10,7 @@ use burn::train::metric::{CpuMemory, CpuTemperature, CpuUse}; use burn::train::{MetricEarlyStoppingStrategy, StoppingCondition}; use burn::{ config::Config, - data::{dataloader::DataLoaderBuilder, dataset::vision::MNISTDataset}, + data::{dataloader::DataLoaderBuilder, dataset::vision::MnistDataset}, tensor::backend::AutodiffBackend, train::{ metric::{AccuracyMetric, LossMetric}, @@ -44,19 +44,19 @@ pub fn run(device: B::Device) { B::seed(config.seed); // Data - let batcher_train = MNISTBatcher::::new(device.clone()); - let batcher_valid = MNISTBatcher::::new(device.clone()); + let batcher_train = MnistBatcher::::new(device.clone()); + let batcher_valid = MnistBatcher::::new(device.clone()); let dataloader_train = DataLoaderBuilder::new(batcher_train) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::train()); + .build(MnistDataset::train()); let dataloader_test = DataLoaderBuilder::new(batcher_valid) .batch_size(config.batch_size) .shuffle(config.seed) .num_workers(config.num_workers) - .build(MNISTDataset::test()); + .build(MnistDataset::test()); // Model let learner = LearnerBuilder::new(ARTIFACT_DIR) diff --git a/examples/onnx-inference/src/bin/mnist_inference.rs b/examples/onnx-inference/src/bin/mnist_inference.rs index f4851beea8..623f197c31 100644 --- a/examples/onnx-inference/src/bin/mnist_inference.rs +++ b/examples/onnx-inference/src/bin/mnist_inference.rs @@ -3,7 +3,7 @@ use std::env::args; use burn::backend::ndarray::NdArray; use burn::tensor::Tensor; -use burn::data::dataset::vision::MNISTDataset; +use burn::data::dataset::vision::MnistDataset; use burn::data::dataset::Dataset; use onnx_inference::mnist::Model; @@ -34,7 +34,7 @@ fn main() { let model: Model = Model::default(); // Load the MNIST dataset and get an item - let dataset = MNISTDataset::test(); + let dataset = MnistDataset::test(); let item = dataset.get(image_index).unwrap(); // Create a tensor from the image data diff --git a/examples/pytorch-import/src/main.rs b/examples/pytorch-import/src/main.rs index 3a7567ce9f..1dafce410c 100644 --- a/examples/pytorch-import/src/main.rs +++ b/examples/pytorch-import/src/main.rs @@ -5,7 +5,7 @@ use burn::backend::ndarray::NdArray; use burn::record::{FullPrecisionSettings, NamedMpkFileRecorder, Recorder}; use burn::tensor::Tensor; -use burn::data::dataset::vision::MNISTDataset; +use burn::data::dataset::vision::MnistDataset; use burn::data::dataset::Dataset; use model::Model; @@ -42,7 +42,7 @@ fn main() { let model: Model = Model::new_with(record); // Load the MNIST dataset and get an item - let dataset = MNISTDataset::test(); + let dataset = MnistDataset::test(); let item = dataset.get(image_index).unwrap(); // Create a tensor from the image data diff --git a/examples/simple-regression/src/model.rs b/examples/simple-regression/src/model.rs index 05ff944ee6..244072401d 100644 --- a/examples/simple-regression/src/model.rs +++ b/examples/simple-regression/src/model.rs @@ -1,10 +1,10 @@ use crate::dataset::DiabetesBatch; use burn::config::Config; use burn::nn::loss::Reduction::Mean; -use burn::nn::ReLU; +use burn::nn::Relu; use burn::{ module::Module, - nn::{loss::MSELoss, Linear, LinearConfig}, + nn::{loss::MseLoss, Linear, LinearConfig}, tensor::{ backend::{AutodiffBackend, Backend}, Tensor, @@ -16,7 +16,7 @@ use burn::{ pub struct RegressionModel { input_layer: Linear, output_layer: Linear, - activation: ReLU, + activation: Relu, } #[derive(Config)] @@ -39,7 +39,7 @@ impl RegressionModelConfig { RegressionModel { input_layer, output_layer, - activation: ReLU::new(), + activation: Relu::new(), } } } @@ -56,7 +56,7 @@ impl RegressionModel { let targets: Tensor = item.targets.unsqueeze(); let output: Tensor = self.forward(item.inputs); - let loss = MSELoss::new().forward(output.clone(), targets.clone(), Mean); + let loss = MseLoss::new().forward(output.clone(), targets.clone(), Mean); RegressionOutput { loss, diff --git a/examples/text-classification/src/training.rs b/examples/text-classification/src/training.rs index 8a101847b4..f0a279693c 100644 --- a/examples/text-classification/src/training.rs +++ b/examples/text-classification/src/training.rs @@ -19,7 +19,7 @@ use burn::{ record::{CompactRecorder, Recorder}, tensor::backend::AutodiffBackend, train::{ - metric::{AccuracyMetric, CUDAMetric, LearningRateMetric, LossMetric}, + metric::{AccuracyMetric, CudaMetric, LearningRateMetric, LossMetric}, LearnerBuilder, }, }; @@ -91,8 +91,8 @@ pub fn train( // Initialize learner let learner = LearnerBuilder::new(artifact_dir) - .metric_train(CUDAMetric::new()) - .metric_valid(CUDAMetric::new()) + .metric_train(CudaMetric::new()) + .metric_valid(CudaMetric::new()) .metric_train_numeric(AccuracyMetric::new()) .metric_valid_numeric(AccuracyMetric::new()) .metric_train_numeric(LossMetric::new()) diff --git a/examples/text-generation/src/training.rs b/examples/text-generation/src/training.rs index d437960ad1..f7f4443488 100644 --- a/examples/text-generation/src/training.rs +++ b/examples/text-generation/src/training.rs @@ -13,7 +13,7 @@ use burn::{ record::{CompactRecorder, DefaultRecorder, Recorder}, tensor::backend::AutodiffBackend, train::{ - metric::{AccuracyMetric, CUDAMetric, LearningRateMetric, LossMetric}, + metric::{AccuracyMetric, CudaMetric, LearningRateMetric, LossMetric}, LearnerBuilder, }, }; @@ -68,8 +68,8 @@ pub fn train + 'static>( .init(); let learner = LearnerBuilder::new(artifact_dir) - .metric_train(CUDAMetric::new()) - .metric_valid(CUDAMetric::new()) + .metric_train(CudaMetric::new()) + .metric_valid(CudaMetric::new()) .metric_train_numeric(AccuracyMetric::new().with_pad_token(tokenizer.pad_token())) .metric_valid_numeric(AccuracyMetric::new().with_pad_token(tokenizer.pad_token())) .metric_train(LossMetric::new())