pub fn clip_gradient_norm<A, D>(gradients: &mut Array<A, D>, maxnorm: A) -> Result<&mut Array<A, D>> where A: Float + ScalarOperand, D: Dimension,
Clips the L2 norm of the gradients to at most `maxnorm` (global gradient clipping).