// nabla_ml/nab_regression.rs
use crate::nab_array::NDArray;
use crate::nab_loss::NabLoss;
use crate::nabla::Nabla;

impl Nabla {
    /// Fits a linear model with an intercept using batch gradient descent.
    ///
    /// All parameters start at zero. Each epoch computes one prediction per row
    /// of `X`, records the mean squared error of those predictions against `y`,
    /// and then moves every parameter against its gradient scaled by `alpha`.
    ///
    /// # Arguments
    ///
    /// * `X` - The input feature matrix. `X.shape()[0]` is taken as the number of
    ///   samples and `X.shape()[1]` as the number of features; `X.data()` is read
    ///   as consecutive rows of `X.shape()[1]` values each.
    /// * `y` - The target values, forwarded as-is to the loss and gradient helpers.
    /// * `alpha` - The learning rate.
    /// * `epochs` - The number of gradient descent iterations.
    ///
    /// # Returns
    ///
    /// A tuple `(theta, history)`:
    ///
    /// * `theta` has `X.shape()[1] + 1` entries; `theta[0]` is the intercept and
    ///   `theta[1..]` are the per-feature coefficients.
    /// * `history` has one MSE value per epoch, measured *before* that epoch's
    ///   parameter update. It is empty when `epochs` is zero.
    ///
    /// # Panics
    ///
    /// Panics if `X.shape()` has fewer than two entries, or if the gradient helper
    /// yields fewer values than there are parameters.
    // `X` and `N` deliberately follow the usual mathematical notation.
    #[allow(non_snake_case)]
    // NOTE(review): presumably kept because nothing inside the crate calls this
    // public entry point outside of tests — confirm before removing.
    #[allow(dead_code)]
    pub fn linear_regression(X: &NDArray, y: &NDArray, alpha: f64, epochs: usize) -> (Vec<f64>, Vec<f64>) {
        let N = X.shape()[0];
        // Loop-invariant lookups, hoisted out of the per-row closure below.
        let n_features = X.shape()[1];
        let features = X.data();

        let mut theta = vec![0.0; n_features + 1]; // +1 for the intercept
        let mut history = Vec::with_capacity(epochs);

        for _ in 0..epochs {
            // Prediction for row i: intercept + dot(row i, theta[1..]).
            let y_pred: Vec<f64> = (0..N)
                .map(|i| {
                    let weighted_sum: f64 = features
                        .iter()
                        .skip(i * n_features)
                        .take(n_features)
                        .zip(&theta[1..])
                        .map(|(&x, &t)| x * t)
                        .sum();
                    theta[0] + weighted_sum
                })
                .collect();

            // Wrap the predictions once and borrow them for both the loss and the
            // gradients, instead of cloning the vector to build two arrays.
            let y_pred = NDArray::from_vec(y_pred);

            // Loss of the current parameters, i.e. before this epoch's update.
            history.push(NabLoss::mean_squared_error(y, &y_pred));

            let gradients = Nabla::linear_regression_gradients(X, y, &y_pred, N);

            // Gradient step; indexing keeps the panic on a too-short gradient
            // vector rather than silently skipping parameters.
            for (j, param) in theta.iter_mut().enumerate() {
                *param -= alpha * gradients[j];
            }
        }

        (theta, history)
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use rand::Rng;

    /// Returns `true` when `value` lies strictly within `tolerance` of `target`.
    fn within(value: f64, target: f64, tolerance: f64) -> bool {
        (value - target).abs() < tolerance
    }

    /// Single-feature fit on randomly generated data around `y = 4 + 3x`.
    ///
    /// The targets carry additive noise drawn with `rng.gen::<f64>()`, so the
    /// recovered parameters are only checked against a loose tolerance of 1.0.
    #[test]
    #[allow(non_snake_case)]
    fn test_linear_regression() {
        let mut rng = rand::thread_rng();

        // 100 one-column rows, each holding 2.0 times a random draw.
        let rows: Vec<_> = (0..100).map(|_| vec![2.0 * rng.gen::<f64>()]).collect();
        let X = NDArray::from_matrix(rows);

        // Noisy targets derived from the feature values.
        let targets: Vec<f64> = X
            .data()
            .iter()
            .map(|&x| 4.0 + 3.0 * x + rng.gen::<f64>())
            .collect();
        let y = NDArray::from_vec(targets);

        let (theta, history) = Nabla::linear_regression(&X, &y, 0.01, 2000);

        assert!(within(theta[0], 4.0, 1.0));
        assert!(within(theta[1], 3.0, 1.0));

        // The last recorded loss must be lower than the first one.
        let initial_loss = *history.first().unwrap();
        let final_loss = *history.last().unwrap();
        assert!(initial_loss > final_loss);
    }

    /// Two-feature fit on a small noise-free dataset generated by
    /// `y = 1 + 1*x1 + 2*x2`.
    #[test]
    #[allow(non_snake_case)]
    fn test_linear_regression_multiple_features() {
        let samples = vec![
            vec![0.0, 0.0],
            vec![1.0, 0.0],
            vec![0.0, 1.0],
            vec![1.0, 1.0],
            vec![2.0, 1.0],
            vec![1.0, 2.0],
            vec![2.0, 2.0],
        ];
        let X = NDArray::from_matrix(samples);
        let y = NDArray::from_vec(vec![1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0]);

        let (theta, history) = Nabla::linear_regression(&X, &y, 0.01, 1000);

        // Dump the intercept and both coefficients for manual inspection.
        for parameter in &theta[..3] {
            println!("{:?}", parameter);
        }

        // Intercept, coefficient for x1, coefficient for x2.
        assert!(within(theta[0], 1.0, 0.1));
        assert!(within(theta[1], 1.0, 0.1));
        assert!(within(theta[2], 2.0, 0.1));

        // The last recorded loss must be lower than the first one.
        let initial_loss = *history.first().unwrap();
        let final_loss = *history.last().unwrap();
        assert!(initial_loss > final_loss);
    }

}