pub fn adaptive_learning_rate( base_lr: f64, gradient_norm: f64, avg_gradient_norm: f64, min_lr: f64, max_lr: f64, ) -> f64
Computes an adaptive learning rate from `base_lr` based on gradient history (the current `gradient_norm` and the average `avg_gradient_norm`).