use crate as burn;
use crate::config::Config;
use crate::module::Module;
use crate::module::Param;
use crate::nn::{Initializer, PaddingConfig1d};
use crate::tensor::backend::Backend;
use crate::tensor::Tensor;
use burn_tensor::module::conv1d;
use burn_tensor::ops::ConvOptions;
use libm::sqrt;
use super::checks;
/// Configuration used to create a `Conv1d` layer.
///
/// `channels_in`, `channels_out` and `kernel_size` carry no default value;
/// every other field has a default declared through its `#[config(default = ...)]` attribute.
#[derive(Config, Debug)]
pub struct Conv1dConfig {
/// Number of input channels. Divided by `groups` to size the second weight dimension.
pub channels_in: usize,
/// Number of output channels. First weight dimension and length of the bias.
pub channels_out: usize,
/// Size of the convolution kernel. Last weight dimension.
pub kernel_size: usize,
/// Stride forwarded to the convolution options (default: 1).
#[config(default = "1")]
pub stride: usize,
/// Dilation forwarded to the convolution options (default: 1).
#[config(default = "1")]
pub dilation: usize,
/// Number of groups forwarded to the convolution options (default: 1).
/// Checked against both channel counts by `checks::checks_channels_div_groups` in `init`.
#[config(default = "1")]
pub groups: usize,
/// Padding configuration, resolved to a concrete amount on each forward pass
/// (default: `PaddingConfig1d::Valid`).
#[config(default = "PaddingConfig1d::Valid")]
pub padding: PaddingConfig1d,
/// Whether `init` creates a bias parameter (default: `true`).
#[config(default = true)]
pub bias: bool,
/// Initializer used for the weight and, when enabled, the bias
/// (default: `KaimingUniform` with gain `1/sqrt(3)` and `fan_out_only = false`).
#[config(default = "Initializer::KaimingUniform{gain:1.0/sqrt(3.0),fan_out_only:false}")]
pub initializer: Initializer,
}
/// 1D convolution layer; `forward` applies `burn_tensor::module::conv1d` with the stored settings.
///
/// Instances are built from a `Conv1dConfig`, either with freshly initialized
/// parameters (`init`) or from an existing record (`init_with`).
#[derive(Module, Debug)]
pub struct Conv1d<B: Backend> {
// Kernel weights; `Conv1dConfig::init` creates them with shape
// `[channels_out, channels_in / groups, kernel_size]`.
weight: Param<Tensor<B, 3>>,
// Optional bias; `Conv1dConfig::init` creates it with shape `[channels_out]`
// when the config's `bias` flag is set, otherwise it is `None`.
bias: Option<Param<Tensor<B, 1>>>,
// Stride passed to the convolution options and to the padding calculation.
stride: usize,
// Kernel size; only read when computing the padding in `forward`.
kernel_size: usize,
// Dilation passed to the convolution options.
dilation: usize,
// Group count passed to the convolution options.
groups: usize,
// Padding strategy, turned into a concrete padding amount per input length.
padding: PaddingConfig1d,
}
impl Conv1dConfig {
    /// Builds a `Conv1d` module with freshly initialized parameters.
    ///
    /// The channel/group combination is first handed to
    /// `checks::checks_channels_div_groups`. The weight is then created with shape
    /// `[channels_out, channels_in / groups, kernel_size]`, and a bias of shape
    /// `[channels_out]` is created only when `self.bias` is set. Both tensors come
    /// from `self.initializer`, with `channels_in / groups * kernel_size` as fan-in
    /// and no fan-out.
    pub fn init<B: Backend>(&self) -> Conv1d<B> {
        checks::checks_channels_div_groups(self.channels_in, self.channels_out, self.groups);

        // Each group only sees its own slice of the input channels.
        let channels_per_group = self.channels_in / self.groups;
        let fan_in: usize = channels_per_group * self.kernel_size;

        // The weight is initialized before the bias so the order in which the
        // initializer is invoked stays the same.
        let weight_shape = [self.channels_out, channels_per_group, self.kernel_size];
        let weight = self
            .initializer
            .init_with(weight_shape, Some(fan_in), None);

        let bias = if self.bias {
            Some(
                self.initializer
                    .init_with([self.channels_out], Some(fan_in), None),
            )
        } else {
            None
        };

        Conv1d {
            weight: Param::from(weight),
            bias: bias.map(Param::from),
            stride: self.stride,
            kernel_size: self.kernel_size,
            dilation: self.dilation,
            groups: self.groups,
            padding: self.padding.clone(),
        }
    }

    /// Builds a `Conv1d` module whose parameters are taken from `record`.
    ///
    /// The weight and bias are moved out of the record as-is; all remaining
    /// settings are copied from this configuration.
    pub fn init_with<B: Backend>(&self, record: Conv1dRecord<B>) -> Conv1d<B> {
        Conv1d {
            weight: record.weight,
            bias: record.bias,
            stride: self.stride,
            kernel_size: self.kernel_size,
            dilation: self.dilation,
            groups: self.groups,
            padding: self.padding.clone(),
        }
    }
}
impl<B: Backend> Conv1d<B> {
    /// Applies the 1D convolution to `input`.
    ///
    /// The last dimension of the rank-3 input is treated as the sequence length:
    /// it is used, together with the kernel size and stride, to resolve the
    /// configured padding into a concrete amount before calling `conv1d`.
    ///
    /// # Shapes
    ///
    /// - input: `[batch_size, channels, length]`
    pub fn forward(&self, input: Tensor<B, 3>) -> Tensor<B, 3> {
        let [_, _, seq_len] = input.dims();

        let pad = self
            .padding
            .calculate_padding_1d(seq_len, self.kernel_size, self.stride);
        let options = ConvOptions::new([self.stride], [pad], [self.dilation], self.groups);

        let weight = self.weight.val();
        let bias = self.bias.as_ref().map(|param| param.val());

        conv1d(input, weight, bias, options)
    }
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::TestBackend;
    use burn_tensor::Data;

    /// With the default initializer, every weight must fall inside
    /// `(-k, k)` where `k = sqrt(groups / (channels_in * kernel_size))`.
    #[test]
    fn initializer_default() {
        TestBackend::seed(0);

        let config = Conv1dConfig::new(5, 5, 5);
        let denominator = (config.channels_in * config.kernel_size) as f64;
        let bound = sqrt(config.groups as f64 / denominator) as f32;

        let layer = config.init::<TestBackend>();

        layer.weight.to_data().assert_within_range(-bound..bound);
    }

    /// Overriding the initializer with `Zeros` must yield an all-zero weight.
    #[test]
    fn initializer_zeros() {
        TestBackend::seed(0);

        let config = Conv1dConfig::new(5, 5, 5).with_initializer(Initializer::Zeros);
        let layer = config.init::<TestBackend>();

        assert_eq!(config.initializer, Initializer::Zeros);

        let expected = Data::zeros(layer.weight.shape());
        layer.weight.to_data().assert_approx_eq(&expected, 3);
    }
}