Add Conv2d (#124)
* (#1) Adding conv2d function

* Adding Conv2D layer

* Adding SaveToNpz and LoadFromNpz for conv

* Adding batch_conv2d

* Adding another placeholder test

* Testing default conv2d

* Testing conv stride 2

* Testing stride 1

* Using checked_sub in conv again instead of a bunch of ifs

* Testing conv padding & stride bigger than kernel

* Testing batch conv2d with 1x1 conv

* Adding tests for Conv2D layer

* Adding docstrings and updating UpdateWithGrads

* Adding conv test with optimizer

* Changing Flatten to FlattenImage

* Adding example conv net

* Ignoring docstring for FlattenImage

* Adding cfg blocks with conv_net example

* optimizing conv forward & backward a bit

* Backward slightly faster

* Slightly cleaning up conv impls

* more small improvements to conv backward
coreylowman authored Aug 20, 2022
1 parent 8da0e44 commit a2024ac
Showing 7 changed files with 904 additions and 37 deletions.
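A note on the "Using checked_sub in conv again instead of a bunch of ifs" bullet above: the device-level conv2d/batch_conv2d kernels added by this commit are not part of the excerpt below, but the idea is that each kernel tap maps an output coordinate back to a padded input coordinate, and `usize::checked_sub` folds the padding bounds check into a single `None` branch. The following stand-alone sketch uses illustrative names and a naive layout, not dfdx's actual kernel, and only shows the pattern for a single channel:

// Hypothetical sketch (not dfdx's kernel): naive 2d cross-correlation for one channel,
// using checked_sub so taps in the zero-padded border are skipped via one `None` path
// per axis instead of several `if` guards.
fn conv2d_naive<const K: usize, const S: usize, const P: usize>(
    img: &[Vec<f32>],       // H x W input image
    kernel: &[[f32; K]; K], // K x K filter
) -> Vec<Vec<f32>> {
    let (h, w) = (img.len(), img[0].len());
    let (oh, ow) = ((h + 2 * P - K) / S + 1, (w + 2 * P - K) / S + 1);
    let mut out = vec![vec![0.0; ow]; oh];
    for oy in 0..oh {
        for ox in 0..ow {
            let mut acc = 0.0;
            for ky in 0..K {
                for kx in 0..K {
                    // Map the output tap back to an input coordinate. `checked_sub`
                    // returns None inside the padded border, so the tap contributes
                    // nothing and we just move on.
                    let iy = match (oy * S + ky).checked_sub(P) {
                        Some(iy) if iy < h => iy,
                        _ => continue,
                    };
                    let ix = match (ox * S + kx).checked_sub(P) {
                        Some(ix) if ix < w => ix,
                        _ => continue,
                    };
                    acc += img[iy][ix] * kernel[ky][kx];
                }
            }
            out[oy][ox] = acc;
        }
    }
    out
}

With K = 3, S = 1, P = 0 this reproduces the spatial behavior of the default `Conv2D<_, _, 3>` on one channel: a 10x10 input yields an 8x8 output, matching the size tests in src/nn/conv.rs below.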
32 changes: 32 additions & 0 deletions examples/conv_net.rs
@@ -0,0 +1,32 @@
#![cfg_attr(feature = "nightly", feature(generic_const_exprs))]

#[cfg(not(feature = "nightly"))]
fn main() {
    panic!("`+nightly` required to run this example.")
}

#[cfg(feature = "nightly")]
fn main() {
    use dfdx::prelude::*;
    use rand::thread_rng;

    type Model = (
        (Conv2D<3, 4, 3>, ReLU),
        (Conv2D<4, 8, 3>, ReLU),
        (Conv2D<8, 16, 3>, ReLU),
        FlattenImage,
        Linear<7744, 10>,
    );
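    // Linear<7744, 10>: three 3x3 convs (stride 1, no padding) take 28x28 -> 26 -> 24 -> 22,
    // and 16 * 22 * 22 = 7744 features after FlattenImage.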

    let mut rng = thread_rng();
    let mut m: Model = Default::default();
    m.reset_params(&mut rng);

    // single image forward
    let x: Tensor3D<3, 28, 28> = TensorCreator::randn(&mut rng);
    let _: Tensor1D<10> = m.forward(x);

    // batched image forward
    let x: Tensor4D<32, 3, 28, 28> = TensorCreator::randn(&mut rng);
    let _: Tensor2D<32, 10> = m.forward(x);
}
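(To run the example, presumably something like `cargo +nightly run --example conv_net --features nightly`, matching the feature gates above.)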
25 changes: 25 additions & 0 deletions src/gradients.rs
@@ -152,6 +152,31 @@ impl Gradients {
        (l_ref, r_ref)
    }

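    /// Borrows the gradients for three tensors mutably and one immutably at the same time.
    /// Added alongside conv2d; its backward pass presumably uses this to write the weight,
    /// bias, and input gradients while reading the output gradient.
    ///
    /// The raw-pointer re-borrows below rely on `l1`, `l2`, `l3`, and `r` referring to
    /// tensors with distinct ids, so none of the returned references alias.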
    pub fn muts_and_ref<L1, L2, L3, R>(
        &mut self,
        l1: &L1,
        l2: &L2,
        l3: &L3,
        r: &R,
    ) -> (&mut L1::Array, &mut L2::Array, &mut L3::Array, &R::Array)
    where
        L1: HasUniqueId + HasArrayType + HasDevice,
        L2: HasUniqueId + HasArrayType + HasDevice,
        L3: HasUniqueId + HasArrayType + HasDevice,
        R: HasUniqueId + HasArrayType,
    {
        // assert_ne!(l1.id(), r.id());
        let l1_ptr = self.mut_gradient(l1) as *mut L1::Array;
        let l2_ptr = self.mut_gradient(l2) as *mut L2::Array;
        let l3_ptr = self.mut_gradient(l3) as *mut L3::Array;
        let r_ptr = self.ref_gradient(r) as *const R::Array;
        let l1_ref = unsafe { &mut *l1_ptr };
        let l2_ref = unsafe { &mut *l2_ptr };
        let l3_ref = unsafe { &mut *l3_ptr };
        let r_ref = unsafe { &*r_ptr };
        (l1_ref, l2_ref, l3_ref, r_ref)
    }

    /// Removes and returns the data associated with `t.id()`.
    ///
    /// **Panics** if data associated with `t` is not found. This indicates an unrecoverable bug.
294 changes: 294 additions & 0 deletions src/nn/conv.rs
@@ -0,0 +1,294 @@
use crate::prelude::*;
use rand::Rng;
use rand_distr::Uniform;
use std::io::{Read, Seek, Write};
use zip::{result::ZipResult, ZipArchive, ZipWriter};

/// **Requires Nightly** Performs 2d convolutions on 3d and 4d images.
///
/// **Pytorch Equivalent**: `torch.nn.Conv2d`
///
/// Generics:
/// - `IN_CHAN`: The number of input channels in an image.
/// - `OUT_CHAN`: The number of channels in the output of the layer.
/// - `KERNEL_SIZE`: The size of the kernel applied to both width and height of the images.
/// - `STRIDE`: How far to move the kernel each step. Defaults to `1`
/// - `PADDING`: How much zero padding to add around the images. Defaults to `0`.
///
/// Examples:
/// ```rust
/// #![feature(generic_const_exprs)]
/// # use dfdx::prelude::*;
/// let m: Conv2D<16, 33, 3> = Default::default();
/// let _: Tensor3D<33, 30, 62> = m.forward(Tensor3D::<16, 32, 64>::zeros());
/// let _: Tensor4D<2, 33, 13, 12> = m.forward(Tensor4D::<2, 16, 15, 14>::zeros());
/// ```
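///
/// Each output spatial dimension is `(input_dim + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1`,
/// as spelled out in the `where` bounds on the [Module] impls below.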
#[derive(Default, Debug, Clone)]
pub struct Conv2D<
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize = 1,
    const PADDING: usize = 0,
> {
    pub weight: Tensor4D<OUT_CHAN, IN_CHAN, KERNEL_SIZE, KERNEL_SIZE>,
    pub bias: Tensor1D<OUT_CHAN>,
}

impl<
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize,
    const PADDING: usize,
> CanUpdateWithGradients for Conv2D<IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING>
{
    fn update<G: GradientProvider>(&mut self, grads: &mut G, unused: &mut UnusedTensors) {
        self.weight.update(grads, unused);
        self.bias.update(grads, unused);
    }
}

impl<
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize,
    const PADDING: usize,
> ResetParams for Conv2D<IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING>
{
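    // This mirrors PyTorch's default Conv2d initialization: weight and bias are both drawn
    // from Uniform(-1/sqrt(k), 1/sqrt(k)) with k = IN_CHAN * KERNEL_SIZE * KERNEL_SIZE.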
    fn reset_params<R: Rng>(&mut self, rng: &mut R) {
        let k = (IN_CHAN * KERNEL_SIZE * KERNEL_SIZE) as f32;
        let bound = 1.0 / k.sqrt();
        let dist = Uniform::new(-bound, bound);
        self.weight.randomize(rng, &dist);
        self.bias.randomize(rng, &dist);
    }
}

impl<
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize,
    const PADDING: usize,
> SaveToNpz for Conv2D<IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING>
{
    /// Saves [Self::weight] to `{pre}weight.npy` and [Self::bias] to `{pre}bias.npy`
    /// using [npz_fwrite()].
    fn write<W>(&self, pre: &str, w: &mut ZipWriter<W>) -> ZipResult<()>
    where
        W: Write + Seek,
    {
        npz_fwrite(w, format!("{pre}weight.npy"), self.weight.data())?;
        npz_fwrite(w, format!("{pre}bias.npy"), self.bias.data())?;
        Ok(())
    }
}

impl<
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize,
    const PADDING: usize,
> LoadFromNpz for Conv2D<IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING>
{
    /// Reads [Self::weight] from `{pre}weight.npy` and [Self::bias] from `{pre}bias.npy`
    /// using [npz_fread()].
    fn read<R>(&mut self, pre: &str, r: &mut ZipArchive<R>) -> Result<(), NpzError>
    where
        R: Read + Seek,
    {
        npz_fread(r, format!("{pre}weight.npy"), self.weight.mut_data())?;
        npz_fread(r, format!("{pre}bias.npy"), self.bias.mut_data())?;
        Ok(())
    }
}

impl<
    TAPE: 'static + Tape,
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize,
    const PADDING: usize,
    const IN_HEIGHT: usize,
    const IN_WIDTH: usize,
> Module<Tensor3D<IN_CHAN, IN_HEIGHT, IN_WIDTH, TAPE>>
    for Conv2D<IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING>
where
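    // These const-expression bounds make the output spatial dimensions computable at the
    // type level; they are why the layer requires the nightly `generic_const_exprs`
    // feature noted in the docstring.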
    [(); (IN_WIDTH + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1]:,
    [(); (IN_HEIGHT + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1]:,
{
    type Output = Tensor3D<
        OUT_CHAN,
        { (IN_HEIGHT + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1 },
        { (IN_WIDTH + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1 },
        TAPE,
    >;

    fn forward(&self, x: Tensor3D<IN_CHAN, IN_HEIGHT, IN_WIDTH, TAPE>) -> Self::Output {
        conv2d::<TAPE, IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING, IN_HEIGHT, IN_WIDTH>(
            x,
            &self.weight,
            &self.bias,
        )
    }
}

impl<
    TAPE: 'static + Tape,
    const BATCH_SIZE: usize,
    const IN_CHAN: usize,
    const OUT_CHAN: usize,
    const KERNEL_SIZE: usize,
    const STRIDE: usize,
    const PADDING: usize,
    const IN_HEIGHT: usize,
    const IN_WIDTH: usize,
> Module<Tensor4D<BATCH_SIZE, IN_CHAN, IN_HEIGHT, IN_WIDTH, TAPE>>
    for Conv2D<IN_CHAN, OUT_CHAN, KERNEL_SIZE, STRIDE, PADDING>
where
    [(); (IN_WIDTH + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1]:,
    [(); (IN_HEIGHT + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1]:,
{
    type Output = Tensor4D<
        BATCH_SIZE,
        OUT_CHAN,
        { (IN_HEIGHT + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1 },
        { (IN_WIDTH + 2 * PADDING - KERNEL_SIZE) / STRIDE + 1 },
        TAPE,
    >;

    fn forward(&self, x: Tensor4D<BATCH_SIZE, IN_CHAN, IN_HEIGHT, IN_WIDTH, TAPE>) -> Self::Output {
        conv2d_batched::<
            TAPE,
            BATCH_SIZE,
            IN_CHAN,
            OUT_CHAN,
            KERNEL_SIZE,
            STRIDE,
            PADDING,
            IN_HEIGHT,
            IN_WIDTH,
        >(x, &self.weight, &self.bias)
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use rand::thread_rng;
    use std::fs::File;
    use tempfile::NamedTempFile;

    #[test]
    fn test_forward_3d_sizes() {
        type Img = Tensor3D<3, 10, 10>;
        let _: Tensor3D<2, 8, 8> = Conv2D::<3, 2, 3>::default().forward(Img::zeros());
        let _: Tensor3D<4, 8, 8> = Conv2D::<3, 4, 3>::default().forward(Img::zeros());
        let _: Tensor3D<4, 9, 9> = Conv2D::<3, 4, 2>::default().forward(Img::zeros());
        let _: Tensor3D<4, 7, 7> = Conv2D::<3, 4, 4>::default().forward(Img::zeros());
        let _: Tensor3D<2, 4, 4> = Conv2D::<3, 2, 3, 2>::default().forward(Img::zeros());
        let _: Tensor3D<2, 3, 3> = Conv2D::<3, 2, 3, 3>::default().forward(Img::zeros());
        let _: Tensor3D<2, 10, 10> = Conv2D::<3, 2, 3, 1, 1>::default().forward(Img::zeros());
        let _: Tensor3D<2, 12, 12> = Conv2D::<3, 2, 3, 1, 2>::default().forward(Img::zeros());
        let _: Tensor3D<2, 6, 6> = Conv2D::<3, 2, 3, 2, 2>::default().forward(Img::zeros());
    }

    #[test]
    fn test_forward_4d_sizes() {
        type Img = Tensor4D<5, 3, 10, 10>;
        let _: Tensor4D<5, 2, 8, 8> = Conv2D::<3, 2, 3>::default().forward(Img::zeros());
        let _: Tensor4D<5, 4, 8, 8> = Conv2D::<3, 4, 3>::default().forward(Img::zeros());
        let _: Tensor4D<5, 4, 9, 9> = Conv2D::<3, 4, 2>::default().forward(Img::zeros());
        let _: Tensor4D<5, 4, 7, 7> = Conv2D::<3, 4, 4>::default().forward(Img::zeros());
        let _: Tensor4D<5, 2, 4, 4> = Conv2D::<3, 2, 3, 2>::default().forward(Img::zeros());
        let _: Tensor4D<5, 2, 3, 3> = Conv2D::<3, 2, 3, 3>::default().forward(Img::zeros());
        let _: Tensor4D<5, 2, 10, 10> = Conv2D::<3, 2, 3, 1, 1>::default().forward(Img::zeros());
        let _: Tensor4D<5, 2, 12, 12> = Conv2D::<3, 2, 3, 1, 2>::default().forward(Img::zeros());
        let _: Tensor4D<5, 2, 6, 6> = Conv2D::<3, 2, 3, 2, 2>::default().forward(Img::zeros());
    }

    #[test]
    fn test_2_conv_sizes() {
        type A = Conv2D<1, 2, 3>;
        type B = Conv2D<2, 4, 3>;
        let _: Tensor3D<4, 6, 6> = <(A, B)>::default().forward(Tensor3D::<1, 10, 10>::zeros());
    }

    #[test]
    fn test_3_conv_sizes() {
        type A = Conv2D<1, 2, 3>;
        type B = Conv2D<2, 4, 3>;
        type C = Conv2D<4, 1, 1, 1, 1>;

        type Img = Tensor3D<1, 10, 10>;
        let _: Tensor3D<1, 8, 8> = <(A, B, C)>::default().forward(Img::zeros());
    }

    #[test]
    fn test_save_conv2d() {
        let model: Conv2D<2, 4, 3> = Default::default();
        let file = NamedTempFile::new().expect("failed to create tempfile");
        model
            .save(file.path().to_str().unwrap())
            .expect("failed to save model");
        let f = File::open(file.path()).expect("failed to open resulting file");
        let mut zip = ZipArchive::new(f).expect("failed to create zip archive from file");
        {
            let weight_file = zip
                .by_name("weight.npy")
                .expect("failed to find weight.npy file");
            assert!(weight_file.size() > 0);
        }
        {
            let bias_file = zip
                .by_name("bias.npy")
                .expect("failed to find bias.npy file");
            assert!(bias_file.size() > 0);
        }
    }

    #[test]
    fn test_load_conv() {
        let mut rng = thread_rng();
        let mut saved_model: Conv2D<2, 4, 3> = Default::default();
        saved_model.reset_params(&mut rng);

        let file = NamedTempFile::new().expect("failed to create tempfile");
        assert!(saved_model.save(file.path().to_str().unwrap()).is_ok());

        let mut loaded_model: Conv2D<2, 4, 3> = Default::default();
        assert!(loaded_model.weight.data() != saved_model.weight.data());
        assert!(loaded_model.bias.data() != saved_model.bias.data());

        assert!(loaded_model.load(file.path().to_str().unwrap()).is_ok());
        assert_eq!(loaded_model.weight.data(), saved_model.weight.data());
        assert_eq!(loaded_model.bias.data(), saved_model.bias.data());
    }

    #[test]
    fn test_conv_with_optimizer() {
        let mut rng = thread_rng();

        let mut m: Conv2D<2, 4, 3> = Default::default();
        m.reset_params(&mut rng);

        let weight_init = m.weight.clone();
        let bias_init = m.bias.clone();

        let mut opt: Sgd<_> = Default::default();
        let out = m.forward(Tensor4D::<8, 2, 28, 28>::randn(&mut rng).trace());
        let gradients = out.square().mean().backward();

        assert_ne!(gradients.ref_gradient(&m.weight), &[[[[0.0; 3]; 3]; 2]; 4]);
        assert_ne!(gradients.ref_gradient(&m.bias), &[0.0; 4]);

        opt.update(&mut m, gradients).expect("unused params");

        assert_ne!(weight_init.data(), m.weight.data());
        assert_ne!(bias_init.data(), m.bias.data());
    }
}