fix: ridge regression, code refactoring

Volodymyr Orlov · Volodymyr Orlov · commit c42fccdc228a · 2020-11-11T15:59:04.000-08:00
diff --git a/src/linear/linear_regression.rs b/src/linear/linear_regression.rs
@@ -154,8 +154,8 @@ impl<T: RealNumber, M: Matrix<T>> LinearRegression<T, M> {
     }
 
     /// Get estimates regression coefficients
-    pub fn coefficients(&self) -> M {
-        self.coefficients.clone()
+    pub fn coefficients(&self) -> &M {
+        &self.coefficients
     }
 
     /// Get estimate of intercept
diff --git a/src/linear/logistic_regression.rs b/src/linear/logistic_regression.rs
@@ -68,7 +68,8 @@ use crate::optimization::FunctionOrder;
 /// Logistic Regression
 #[derive(Serialize, Deserialize, Debug)]
 pub struct LogisticRegression<T: RealNumber, M: Matrix<T>> {
-    weights: M,
+    coefficients: M,
+    intercept: M,
     classes: Vec<T>,
     num_attributes: usize,
     num_classes: usize,
@@ -109,7 +110,7 @@ impl<T: RealNumber, M: Matrix<T>> PartialEq for LogisticRegression<T, M> {
                 }
             }
 
-            return self.weights == other.weights;
+            return self.coefficients == other.coefficients && self.intercept == other.intercept;
         }
     }
 }
@@ -246,9 +247,11 @@ impl<T: RealNumber, M: Matrix<T>> LogisticRegression<T, M> {
             };
 
             let result = LogisticRegression::minimize(x0, objective);
+            let weights = result.x;
 
             Ok(LogisticRegression {
-                weights: result.x,
+                coefficients: weights.slice(0..1, 0..num_attributes),
+                intercept: weights.slice(0..1, num_attributes..num_attributes + 1),
                 classes: classes,
                 num_attributes: num_attributes,
                 num_classes: k,
@@ -268,7 +271,8 @@ impl<T: RealNumber, M: Matrix<T>> LogisticRegression<T, M> {
             let weights = result.x.reshape(k, num_attributes + 1);
 
             Ok(LogisticRegression {
-                weights: weights,
+                coefficients: weights.slice(0..k, 0..num_attributes),
+                intercept: weights.slice(0..k, num_attributes..num_attributes + 1),
                 classes: classes,
                 num_attributes: num_attributes,
                 num_classes: k,
@@ -283,21 +287,26 @@ impl<T: RealNumber, M: Matrix<T>> LogisticRegression<T, M> {
         let mut result = M::zeros(1, n);
         if self.num_classes == 2 {
             let (nrows, _) = x.shape();
-            let x_and_bias = x.h_stack(&M::ones(nrows, 1));
-            let y_hat: Vec<T> = x_and_bias
-                .matmul(&self.weights.transpose())
-                .get_col_as_vec(0);
+            let y_hat: Vec<T> = x.matmul(&self.coefficients.transpose()).get_col_as_vec(0);
+            let intercept = self.intercept.get(0, 0);
             for i in 0..n {
                 result.set(
                     0,
                     i,
-                    self.classes[if y_hat[i].sigmoid() > T::half() { 1 } else { 0 }],
+                    self.classes[if (y_hat[i] + intercept).sigmoid() > T::half() {
+                        1
+                    } else {
+                        0
+                    }],
                 );
             }
         } else {
-            let (nrows, _) = x.shape();
-            let x_and_bias = x.h_stack(&M::ones(nrows, 1));
-            let y_hat = x_and_bias.matmul(&self.weights.transpose());
+            let mut y_hat = x.matmul(&self.coefficients.transpose());
+            for r in 0..n {
+                for c in 0..self.num_classes {
+                    y_hat.set(r, c, y_hat.get(r, c) + self.intercept.get(c, 0));
+                }
+            }
             let class_idxs = y_hat.argmax();
             for i in 0..n {
                 result.set(0, i, self.classes[class_idxs[i]]);
@@ -307,17 +316,13 @@ impl<T: RealNumber, M: Matrix<T>> LogisticRegression<T, M> {
     }
 
     /// Get estimates regression coefficients
-    pub fn coefficients(&self) -> M {
-        self.weights
-            .slice(0..self.num_classes, 0..self.num_attributes)
+    pub fn coefficients(&self) -> &M {
+        &self.coefficients
     }
 
     /// Get estimate of intercept
-    pub fn intercept(&self) -> M {
-        self.weights.slice(
-            0..self.num_classes,
-            self.num_attributes..self.num_attributes + 1,
-        )
+    pub fn intercept(&self) -> &M {
+        &self.intercept
     }
 
     fn minimize(x0: M, objective: impl ObjectiveFunction<T, M>) -> OptimizerResult<T, M> {
@@ -336,7 +341,9 @@ impl<T: RealNumber, M: Matrix<T>> LogisticRegression<T, M> {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::dataset::generator::make_blobs;
     use crate::linalg::naive::dense_matrix::*;
+    use crate::metrics::accuracy;
 
     #[test]
     fn multiclass_objective_f() {
@@ -466,6 +473,34 @@ mod tests {
         );
     }
 
+    #[test]
+    fn lr_fit_predict_multiclass() {
+        let blobs = make_blobs(15, 4, 3);
+
+        let x = DenseMatrix::from_vec(15, 4, &blobs.data);
+        let y = blobs.target;
+
+        let lr = LogisticRegression::fit(&x, &y).unwrap();
+
+        let y_hat = lr.predict(&x).unwrap();
+
+        assert!(accuracy(&y_hat, &y) > 0.9);
+    }
+
+    #[test]
+    fn lr_fit_predict_binary() {
+        let blobs = make_blobs(20, 4, 2);
+
+        let x = DenseMatrix::from_vec(20, 4, &blobs.data);
+        let y = blobs.target;
+
+        let lr = LogisticRegression::fit(&x, &y).unwrap();
+
+        let y_hat = lr.predict(&x).unwrap();
+
+        assert!(accuracy(&y_hat, &y) > 0.9);
+    }
+
     #[test]
     fn serde() {
         let x = DenseMatrix::from_2d_array(&[
diff --git a/src/linear/ridge_regression.rs b/src/linear/ridge_regression.rs
@@ -134,6 +134,10 @@ impl<T: RealNumber, M: Matrix<T>> RidgeRegression<T, M> {
             )));
         }
 
+        if y.len() != n {
+            return Err(Failed::fit(&format!("Number of rows in X should = len(y)")));
+        }
+
         let y_column = M::from_row_vector(y.clone()).transpose();
 
         let (w, b) = if parameters.normalize {
@@ -216,8 +220,8 @@ impl<T: RealNumber, M: Matrix<T>> RidgeRegression<T, M> {
     }
 
     /// Get estimates regression coefficients
-    pub fn coefficients(&self) -> M {
-        self.coefficients.clone()
+    pub fn coefficients(&self) -> &M {
+        &self.coefficients
     }
 
     /// Get estimate of intercept

Original file line number	Diff line number	Diff line change
`@@ -154,8 +154,8 @@ impl<T: RealNumber, M: Matrix<T>> LinearRegression<T, M> {`
`154`	`154`	`}`
`155`	`155`
`156`	`156`	`/// Get estimates regression coefficients`
`157`		`- pub fn coefficients(&self) -> M {`
`158`		`- self.coefficients.clone()`
	`157`	`+ pub fn coefficients(&self) -> &M {`
	`158`	`+ &self.coefficients`
`159`	`159`	`}`
`160`	`160`
`161`	`161`	`/// Get estimate of intercept`
Original file line number	Diff line number	Diff line change
`@@ -134,6 +134,10 @@ impl<T: RealNumber, M: Matrix<T>> RidgeRegression<T, M> {`
`134`	`134`	`)));`
`135`	`135`	`}`
`136`	`136`
	`137`	`+ if y.len() != n {`
	`138`	`+ return Err(Failed::fit(&format!("Number of rows in X should = len(y)")));`
	`139`	`+ }`
	`140`	`+`
`137`	`141`	`let y_column = M::from_row_vector(y.clone()).transpose();`
`138`	`142`
`139`	`143`	`let (w, b) = if parameters.normalize {`
`@@ -216,8 +220,8 @@ impl<T: RealNumber, M: Matrix<T>> RidgeRegression<T, M> {`
`216`	`220`	`}`
`217`	`221`
`218`	`222`	`/// Get estimates regression coefficients`
`219`		`- pub fn coefficients(&self) -> M {`
`220`		`- self.coefficients.clone()`
	`223`	`+ pub fn coefficients(&self) -> &M {`
	`224`	`+ &self.coefficients`
`221`	`225`	`}`
`222`	`226`
`223`	`227`	`/// Get estimate of intercept`