Merge potential next release v0.4 (#187) Breaking Changes

* First draft of the new n-dimensional arrays + NB use case * Improves default implementation of multiple Array methods * Refactors tree methods * Adds matrix decomposition routines * Adds matrix decomposition methods to ndarray and nalgebra bindings * Refactoring + linear regression now uses array2 * Ridge & Linear regression * LBFGS optimizer & logistic regression * LBFGS optimizer & logistic regression * Changes linear methods, metrics and model selection methods to new n-dimensional arrays * Switches KNN and clustering algorithms to new n-d array layer * Refactors distance metrics * Optimizes knn and clustering methods * Refactors metrics module * Switches decomposition methods to n-dimensional arrays * Linalg refactoring - cleanup rng merge (#172) * Remove legacy DenseMatrix and BaseMatrix implementation. Port the new Number, FloatNumber and Array implementation into module structure. * Exclude AUC metrics. Needs reimplementation * Improve developers walkthrough New traits system in place at `src/numbers` and `src/linalg` Co-authored-by: Lorenzo <tunedconsulting@gmail.com> * Provide SupervisedEstimator with a constructor to avoid explicit dynamical box allocation in 'cross_validate' and 'cross_validate_predict' as required by the use of 'dyn' as per Rust 2021 * Implement getters to use as_ref() in src/neighbors * Implement getters to use as_ref() in src/naive_bayes * Implement getters to use as_ref() in src/linear * Add Clone to src/naive_bayes * Change signature for cross_validate and other model_selection functions to abide to use of dyn in Rust 2021 * Implement ndarray-bindings. Remove FloatNumber from implementations * Drop nalgebra-bindings support (as decided in conf-call to go for ndarray) * Remove benches. Benches will have their own repo at smartcore-benches * Implement SVC * Implement SVC serialization. Move search parameters in dedicated module * Implement SVR. Definitely too slow * Fix compilation issues for wasm (#202) Co-authored-by: Luis Moreno <morenol@users.noreply.github.com> * Fix tests (#203) * Port linalg/traits/stats.rs * Improve methods naming * Improve Display for DenseMatrix Co-authored-by: Montana Low <montanalow@users.noreply.github.com> Co-authored-by: VolodymyrOrlov <volodymyr.orlov@gmail.com>
2022-10-31 10:44:57 +00:00
parent bb71656137
commit 52eb6ce023
110 changed files with 10327 additions and 9107 deletions
@@ -21,7 +21,9 @@
 //! Example:
 //!
 //! ```
-//! use smartcore::linalg::naive::dense_matrix::*;
+//! use rand::Rng;
+//!
+//! use smartcore::linalg::basic::matrix::DenseMatrix;
 //! use smartcore::tree::decision_tree_classifier::*;
 //!
 //! // Iris dataset
@@ -47,8 +49,8 @@
 //!            &[6.6, 2.9, 4.6, 1.3],
 //!            &[5.2, 2.7, 3.9, 1.4],
 //!         ]);
-//! let y = vec![ 0., 0., 0., 0., 0., 0., 0., 0.,
-//!            1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.];
+//! let y = vec![ 0, 0, 0, 0, 0, 0, 0, 0,
+//!            1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1];
 //!
 //! let tree = DecisionTreeClassifier::fit(&x, &y, Default::default()).unwrap();
 //!
@@ -69,15 +71,15 @@ use std::marker::PhantomData;

 use rand::seq::SliceRandom;
 use rand::Rng;
+
 #[cfg(feature = "serde")]
 use serde::{Deserialize, Serialize};

-use crate::algorithm::sort::quick_sort::QuickArgSort;
 use crate::api::{Predictor, SupervisedEstimator};
 use crate::error::Failed;
-use crate::linalg::Matrix;
-use crate::math::num::RealNumber;
-use crate::rand::get_rng_impl;
+use crate::linalg::basic::arrays::{Array1, Array2, MutArrayView1};
+use crate::numbers::basenum::Number;
+use crate::rand_custom::get_rng_impl;

 #[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 #[derive(Debug, Clone)]
@@ -103,12 +105,41 @@ pub struct DecisionTreeClassifierParameters {
 /// Decision Tree
 #[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
 #[derive(Debug)]
-pub struct DecisionTreeClassifier<T: RealNumber> {
-    nodes: Vec<Node<T>>,
-    parameters: DecisionTreeClassifierParameters,
+pub struct DecisionTreeClassifier<
+    TX: Number + PartialOrd,
+    TY: Number + Ord,
+    X: Array2<TX>,
+    Y: Array1<TY>,
+> {
+    nodes: Vec<Node>,
+    parameters: Option<DecisionTreeClassifierParameters>,
    num_classes: usize,
-    classes: Vec<T>,
+    classes: Vec<TY>,
    depth: u16,
+    _phantom_tx: PhantomData<TX>,
+    _phantom_x: PhantomData<X>,
+    _phantom_y: PhantomData<Y>,
+}
+
+impl<TX: Number + PartialOrd, TY: Number + Ord, X: Array2<TX>, Y: Array1<TY>>
+    DecisionTreeClassifier<TX, TY, X, Y>
+{
+    /// Get nodes, return a shared reference
+    fn nodes(&self) -> &Vec<Node> {
+        self.nodes.as_ref()
+    }
+    /// Get parameters, return a shared reference
+    fn parameters(&self) -> &DecisionTreeClassifierParameters {
+        self.parameters.as_ref().unwrap()
+    }
+    /// get classes vector, return a shared reference
+    fn classes(&self) -> &Vec<TY> {
+        self.classes.as_ref()
+    }
+    /// Get depth of tree
+    fn depth(&self) -> u16 {
+        self.depth
+    }
 }

 /// The function to measure the quality of a split.
@@ -130,51 +161,51 @@ impl Default for SplitCriterion {
 }

 #[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
-#[derive(Debug)]
-struct Node<T: RealNumber> {
-    _index: usize,
+#[derive(Debug, Clone)]
+struct Node {
+    index: usize,
    output: usize,
    split_feature: usize,
-    split_value: Option<T>,
-    split_score: Option<T>,
+    split_value: Option<f64>,
+    split_score: Option<f64>,
    true_child: Option<usize>,
    false_child: Option<usize>,
 }

-impl<T: RealNumber> PartialEq for DecisionTreeClassifier<T> {
+impl<TX: Number + PartialOrd, TY: Number + Ord, X: Array2<TX>, Y: Array1<TY>> PartialEq
+    for DecisionTreeClassifier<TX, TY, X, Y>
+{
    fn eq(&self, other: &Self) -> bool {
        if self.depth != other.depth
            || self.num_classes != other.num_classes
-            || self.nodes.len() != other.nodes.len()
+            || self.nodes().len() != other.nodes().len()
        {
            false
        } else {
-            for i in 0..self.classes.len() {
-                if (self.classes[i] - other.classes[i]).abs() > T::epsilon() {
-                    return false;
-                }
-            }
-            for i in 0..self.nodes.len() {
-                if self.nodes[i] != other.nodes[i] {
-                    return false;
-                }
-            }
-            true
+            self.classes()
+                .iter()
+                .zip(other.classes().iter())
+                .all(|(a, b)| a == b)
+                && self
+                    .nodes()
+                    .iter()
+                    .zip(other.nodes().iter())
+                    .all(|(a, b)| a == b)
        }
    }
 }

-impl<T: RealNumber> PartialEq for Node<T> {
+impl PartialEq for Node {
    fn eq(&self, other: &Self) -> bool {
        self.output == other.output
            && self.split_feature == other.split_feature
            && match (self.split_value, other.split_value) {
-                (Some(a), Some(b)) => (a - b).abs() < T::epsilon(),
+                (Some(a), Some(b)) => (a - b).abs() < std::f64::EPSILON,
                (None, None) => true,
                _ => false,
            }
            && match (self.split_score, other.split_score) {
-                (Some(a), Some(b)) => (a - b).abs() < T::epsilon(),
+                (Some(a), Some(b)) => (a - b).abs() < std::f64::EPSILON,
                (None, None) => true,
                _ => false,
            }
@@ -208,10 +239,10 @@ impl Default for DecisionTreeClassifierParameters {
    fn default() -> Self {
        DecisionTreeClassifierParameters {
            criterion: SplitCriterion::default(),
-            max_depth: None,
+            max_depth: Option::None,
            min_samples_leaf: 1,
            min_samples_split: 2,
-            seed: None,
+            seed: Option::None,
        }
    }
 }
@@ -374,10 +405,10 @@ impl Default for DecisionTreeClassifierSearchParameters {
    }
 }

-impl<T: RealNumber> Node<T> {
+impl Node {
    fn new(index: usize, output: usize) -> Self {
        Node {
-            _index: index,
+            index,
            output,
            split_feature: 0,
            split_value: Option::None,
@@ -388,8 +419,8 @@ impl<T: RealNumber> Node<T> {
    }
 }

-struct NodeVisitor<'a, T: RealNumber, M: Matrix<T>> {
-    x: &'a M,
+struct NodeVisitor<'a, TX: Number + PartialOrd, X: Array2<TX>> {
+    x: &'a X,
    y: &'a [usize],
    node: usize,
    samples: Vec<usize>,
@@ -397,18 +428,18 @@ struct NodeVisitor<'a, T: RealNumber, M: Matrix<T>> {
    true_child_output: usize,
    false_child_output: usize,
    level: u16,
-    phantom: PhantomData<&'a T>,
+    phantom: PhantomData<&'a TX>,
 }

-fn impurity<T: RealNumber>(criterion: &SplitCriterion, count: &[usize], n: usize) -> T {
-    let mut impurity = T::zero();
+fn impurity(criterion: &SplitCriterion, count: &[usize], n: usize) -> f64 {
+    let mut impurity = 0f64;

    match criterion {
        SplitCriterion::Gini => {
-            impurity = T::one();
+            impurity = 1f64;
            for count_i in count.iter() {
                if *count_i > 0 {
-                    let p = T::from(*count_i).unwrap() / T::from(n).unwrap();
+                    let p = *count_i as f64 / n as f64;
                    impurity -= p * p;
                }
            }
@@ -417,7 +448,7 @@ fn impurity<T: RealNumber>(criterion: &SplitCriterion, count: &[usize], n: usize
        SplitCriterion::Entropy => {
            for count_i in count.iter() {
                if *count_i > 0 {
-                    let p = T::from(*count_i).unwrap() / T::from(n).unwrap();
+                    let p = *count_i as f64 / n as f64;
                    impurity -= p * p.log2();
                }
            }
@@ -425,22 +456,22 @@ fn impurity<T: RealNumber>(criterion: &SplitCriterion, count: &[usize], n: usize
        SplitCriterion::ClassificationError => {
            for count_i in count.iter() {
                if *count_i > 0 {
-                    impurity = impurity.max(T::from(*count_i).unwrap() / T::from(n).unwrap());
+                    impurity = impurity.max(*count_i as f64 / n as f64);
                }
            }
-            impurity = (T::one() - impurity).abs();
+            impurity = (1f64 - impurity).abs();
        }
    }

    impurity
 }

-impl<'a, T: RealNumber, M: Matrix<T>> NodeVisitor<'a, T, M> {
+impl<'a, TX: Number + PartialOrd, X: Array2<TX>> NodeVisitor<'a, TX, X> {
    fn new(
        node_id: usize,
        samples: Vec<usize>,
        order: &'a [Vec<usize>],
-        x: &'a M,
+        x: &'a X,
        y: &'a [usize],
        level: u16,
    ) -> Self {
@@ -472,50 +503,62 @@ pub(crate) fn which_max(x: &[usize]) -> usize {
    which
 }

-impl<T: RealNumber, M: Matrix<T>>
-    SupervisedEstimator<M, M::RowVector, DecisionTreeClassifierParameters>
-    for DecisionTreeClassifier<T>
+impl<TX: Number + PartialOrd, TY: Number + Ord, X: Array2<TX>, Y: Array1<TY>>
+    SupervisedEstimator<X, Y, DecisionTreeClassifierParameters>
+    for DecisionTreeClassifier<TX, TY, X, Y>
 {
-    fn fit(
-        x: &M,
-        y: &M::RowVector,
-        parameters: DecisionTreeClassifierParameters,
-    ) -> Result<Self, Failed> {
+    fn new() -> Self {
+        Self {
+            nodes: vec![],
+            parameters: Option::None,
+            num_classes: 0usize,
+            classes: vec![],
+            depth: 0u16,
+            _phantom_tx: PhantomData,
+            _phantom_x: PhantomData,
+            _phantom_y: PhantomData,
+        }
+    }
+
+    fn fit(x: &X, y: &Y, parameters: DecisionTreeClassifierParameters) -> Result<Self, Failed> {
        DecisionTreeClassifier::fit(x, y, parameters)
    }
 }

-impl<T: RealNumber, M: Matrix<T>> Predictor<M, M::RowVector> for DecisionTreeClassifier<T> {
-    fn predict(&self, x: &M) -> Result<M::RowVector, Failed> {
+impl<TX: Number + PartialOrd, TY: Number + Ord, X: Array2<TX>, Y: Array1<TY>> Predictor<X, Y>
+    for DecisionTreeClassifier<TX, TY, X, Y>
+{
+    fn predict(&self, x: &X) -> Result<Y, Failed> {
        self.predict(x)
    }
 }

-impl<T: RealNumber> DecisionTreeClassifier<T> {
+impl<TX: Number + PartialOrd, TY: Number + Ord, X: Array2<TX>, Y: Array1<TY>>
+    DecisionTreeClassifier<TX, TY, X, Y>
+{
    /// Build a decision tree classifier from the training data.
    /// * `x` - _NxM_ matrix with _N_ observations and _M_ features in each observation.
    /// * `y` - the target class values
-    pub fn fit<M: Matrix<T>>(
-        x: &M,
-        y: &M::RowVector,
+    pub fn fit(
+        x: &X,
+        y: &Y,
        parameters: DecisionTreeClassifierParameters,
-    ) -> Result<DecisionTreeClassifier<T>, Failed> {
+    ) -> Result<DecisionTreeClassifier<TX, TY, X, Y>, Failed> {
        let (x_nrows, num_attributes) = x.shape();
        let samples = vec![1; x_nrows];
        DecisionTreeClassifier::fit_weak_learner(x, y, samples, num_attributes, parameters)
    }

-    pub(crate) fn fit_weak_learner<M: Matrix<T>>(
-        x: &M,
-        y: &M::RowVector,
+    pub(crate) fn fit_weak_learner(
+        x: &X,
+        y: &Y,
        samples: Vec<usize>,
        mtry: usize,
        parameters: DecisionTreeClassifierParameters,
-    ) -> Result<DecisionTreeClassifier<T>, Failed> {
-        let y_m = M::from_row_vector(y.clone());
-        let (_, y_ncols) = y_m.shape();
+    ) -> Result<DecisionTreeClassifier<TX, TY, X, Y>, Failed> {
+        let y_ncols = y.shape();
        let (_, num_attributes) = x.shape();
-        let classes = y_m.unique();
+        let classes = y.unique();
        let k = classes.len();
        if k < 2 {
            return Err(Failed::fit(&format!(
@@ -528,11 +571,11 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
        let mut yi: Vec<usize> = vec![0; y_ncols];

        for (i, yi_i) in yi.iter_mut().enumerate().take(y_ncols) {
-            let yc = y_m.get(0, i);
-            *yi_i = classes.iter().position(|c| yc == *c).unwrap();
+            let yc = y.get(i);
+            *yi_i = classes.iter().position(|c| yc == c).unwrap();
        }

-        let mut nodes: Vec<Node<T>> = Vec::new();
+        let mut change_nodes: Vec<Node> = Vec::new();

        let mut count = vec![0; k];
        for i in 0..y_ncols {
@@ -540,30 +583,34 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
        }

        let root = Node::new(0, which_max(&count));
-        nodes.push(root);
+        change_nodes.push(root);
        let mut order: Vec<Vec<usize>> = Vec::new();

        for i in 0..num_attributes {
-            order.push(x.get_col_as_vec(i).quick_argsort_mut());
+            let mut col_i: Vec<TX> = x.get_col(i).iterator(0).copied().collect();
+            order.push(col_i.argsort_mut());
        }

        let mut tree = DecisionTreeClassifier {
-            nodes,
-            parameters,
+            nodes: change_nodes,
+            parameters: Some(parameters),
            num_classes: k,
            classes,
-            depth: 0,
+            depth: 0u16,
+            _phantom_tx: PhantomData,
+            _phantom_x: PhantomData,
+            _phantom_y: PhantomData,
        };

-        let mut visitor = NodeVisitor::<T, M>::new(0, samples, &order, x, &yi, 1);
+        let mut visitor = NodeVisitor::<TX, X>::new(0, samples, &order, x, &yi, 1);

-        let mut visitor_queue: LinkedList<NodeVisitor<'_, T, M>> = LinkedList::new();
+        let mut visitor_queue: LinkedList<NodeVisitor<'_, TX, X>> = LinkedList::new();

        if tree.find_best_cutoff(&mut visitor, mtry, &mut rng) {
            visitor_queue.push_back(visitor);
        }

-        while tree.depth < tree.parameters.max_depth.unwrap_or(std::u16::MAX) {
+        while tree.depth() < tree.parameters().max_depth.unwrap_or(std::u16::MAX) {
            match visitor_queue.pop_front() {
                Some(node) => tree.split(node, mtry, &mut visitor_queue, &mut rng),
                None => break,
@@ -575,19 +622,19 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {

    /// Predict class value for `x`.
    /// * `x` - _KxM_ data where _K_ is number of observations and _M_ is number of features.
-    pub fn predict<M: Matrix<T>>(&self, x: &M) -> Result<M::RowVector, Failed> {
-        let mut result = M::zeros(1, x.shape().0);
+    pub fn predict(&self, x: &X) -> Result<Y, Failed> {
+        let mut result = Y::zeros(x.shape().0);

        let (n, _) = x.shape();

        for i in 0..n {
-            result.set(0, i, self.classes[self.predict_for_row(x, i)]);
+            result.set(i, self.classes()[self.predict_for_row(x, i)]);
        }

-        Ok(result.to_row_vector())
+        Ok(result)
    }

-    pub(crate) fn predict_for_row<M: Matrix<T>>(&self, x: &M, row: usize) -> usize {
+    pub(crate) fn predict_for_row(&self, x: &X, row: usize) -> usize {
        let mut result = 0;
        let mut queue: LinkedList<usize> = LinkedList::new();

@@ -596,11 +643,11 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
        while !queue.is_empty() {
            match queue.pop_front() {
                Some(node_id) => {
-                    let node = &self.nodes[node_id];
-                    if node.true_child == None && node.false_child == None {
+                    let node = &self.nodes()[node_id];
+                    if node.true_child.is_none() && node.false_child.is_none() {
                        result = node.output;
-                    } else if x.get(row, node.split_feature)
-                        <= node.split_value.unwrap_or_else(T::nan)
+                    } else if x.get((row, node.split_feature)).to_f64().unwrap()
+                        <= node.split_value.unwrap_or(std::f64::NAN)
                    {
                        queue.push_back(node.true_child.unwrap());
                    } else {
@@ -614,9 +661,9 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
        result
    }

-    fn find_best_cutoff<M: Matrix<T>>(
+    fn find_best_cutoff(
        &mut self,
-        visitor: &mut NodeVisitor<'_, T, M>,
+        visitor: &mut NodeVisitor<'_, TX, X>,
        mtry: usize,
        rng: &mut impl Rng,
    ) -> bool {
@@ -641,7 +688,7 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {

        let n = visitor.samples.iter().sum();

-        if n <= self.parameters.min_samples_split {
+        if n <= self.parameters().min_samples_split {
            return false;
        }

@@ -653,7 +700,7 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
            }
        }

-        let parent_impurity = impurity(&self.parameters.criterion, &count, n);
+        let parent_impurity = impurity(&self.parameters().criterion, &count, n);

        let mut variables = (0..n_attr).collect::<Vec<_>>();

@@ -672,26 +719,28 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
            );
        }

-        self.nodes[visitor.node].split_score != Option::None
+        self.nodes()[visitor.node].split_score.is_some()
    }

-    fn find_best_split<M: Matrix<T>>(
+    fn find_best_split(
        &mut self,
-        visitor: &mut NodeVisitor<'_, T, M>,
+        visitor: &mut NodeVisitor<'_, TX, X>,
        n: usize,
        count: &[usize],
        false_count: &mut [usize],
-        parent_impurity: T,
+        parent_impurity: f64,
        j: usize,
    ) {
        let mut true_count = vec![0; self.num_classes];
-        let mut prevx = T::nan();
+        let mut prevx = Option::None;
        let mut prevy = 0;

        for i in visitor.order[j].iter() {
            if visitor.samples[*i] > 0 {
-                if prevx.is_nan() || visitor.x.get(*i, j) == prevx || visitor.y[*i] == prevy {
-                    prevx = visitor.x.get(*i, j);
+                let x_ij = *visitor.x.get((*i, j));
+
+                if prevx.is_none() || x_ij == prevx.unwrap() || visitor.y[*i] == prevy {
+                    prevx = Some(x_ij);
                    prevy = visitor.y[*i];
                    true_count[visitor.y[*i]] += visitor.samples[*i];
                    continue;
@@ -700,8 +749,10 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
                let tc = true_count.iter().sum();
                let fc = n - tc;

-                if tc < self.parameters.min_samples_leaf || fc < self.parameters.min_samples_leaf {
-                    prevx = visitor.x.get(*i, j);
+                if tc < self.parameters().min_samples_leaf
+                    || fc < self.parameters().min_samples_leaf
+                {
+                    prevx = Some(x_ij);
                    prevy = visitor.y[*i];
                    true_count[visitor.y[*i]] += visitor.samples[*i];
                    continue;
@@ -714,34 +765,35 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
                let true_label = which_max(&true_count);
                let false_label = which_max(false_count);
                let gain = parent_impurity
-                    - T::from(tc).unwrap() / T::from(n).unwrap()
-                        * impurity(&self.parameters.criterion, &true_count, tc)
-                    - T::from(fc).unwrap() / T::from(n).unwrap()
-                        * impurity(&self.parameters.criterion, false_count, fc);
+                    - tc as f64 / n as f64
+                        * impurity(&self.parameters().criterion, &true_count, tc)
+                    - fc as f64 / n as f64
+                        * impurity(&self.parameters().criterion, false_count, fc);

-                if self.nodes[visitor.node].split_score == Option::None
-                    || gain > self.nodes[visitor.node].split_score.unwrap()
+                if self.nodes()[visitor.node].split_score.is_none()
+                    || gain > self.nodes()[visitor.node].split_score.unwrap()
                {
                    self.nodes[visitor.node].split_feature = j;
                    self.nodes[visitor.node].split_value =
-                        Option::Some((visitor.x.get(*i, j) + prevx) / T::two());
+                        Option::Some((x_ij + prevx.unwrap()).to_f64().unwrap() / 2f64);
                    self.nodes[visitor.node].split_score = Option::Some(gain);
+
                    visitor.true_child_output = true_label;
                    visitor.false_child_output = false_label;
                }

-                prevx = visitor.x.get(*i, j);
+                prevx = Some(x_ij);
                prevy = visitor.y[*i];
                true_count[visitor.y[*i]] += visitor.samples[*i];
            }
        }
    }

-    fn split<'a, M: Matrix<T>>(
+    fn split<'a>(
        &mut self,
-        mut visitor: NodeVisitor<'a, T, M>,
+        mut visitor: NodeVisitor<'a, TX, X>,
        mtry: usize,
-        visitor_queue: &mut LinkedList<NodeVisitor<'a, T, M>>,
+        visitor_queue: &mut LinkedList<NodeVisitor<'a, TX, X>>,
        rng: &mut impl Rng,
    ) -> bool {
        let (n, _) = visitor.x.shape();
@@ -751,8 +803,14 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {

        for (i, true_sample) in true_samples.iter_mut().enumerate().take(n) {
            if visitor.samples[i] > 0 {
-                if visitor.x.get(i, self.nodes[visitor.node].split_feature)
-                    <= self.nodes[visitor.node].split_value.unwrap_or_else(T::nan)
+                if visitor
+                    .x
+                    .get((i, self.nodes()[visitor.node].split_feature))
+                    .to_f64()
+                    .unwrap()
+                    <= self.nodes()[visitor.node]
+                        .split_value
+                        .unwrap_or(std::f64::NAN)
                {
                    *true_sample = visitor.samples[i];
                    tc += *true_sample;
@@ -763,26 +821,27 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
            }
        }

-        if tc < self.parameters.min_samples_leaf || fc < self.parameters.min_samples_leaf {
+        if tc < self.parameters().min_samples_leaf || fc < self.parameters().min_samples_leaf {
            self.nodes[visitor.node].split_feature = 0;
            self.nodes[visitor.node].split_value = Option::None;
            self.nodes[visitor.node].split_score = Option::None;
+
            return false;
        }

-        let true_child_idx = self.nodes.len();
+        let true_child_idx = self.nodes().len();
+
        self.nodes
            .push(Node::new(true_child_idx, visitor.true_child_output));
-        let false_child_idx = self.nodes.len();
+        let false_child_idx = self.nodes().len();
        self.nodes
            .push(Node::new(false_child_idx, visitor.false_child_output));
-
        self.nodes[visitor.node].true_child = Some(true_child_idx);
        self.nodes[visitor.node].false_child = Some(false_child_idx);

        self.depth = u16::max(self.depth, visitor.level + 1);

-        let mut true_visitor = NodeVisitor::<T, M>::new(
+        let mut true_visitor = NodeVisitor::<TX, X>::new(
            true_child_idx,
            true_samples,
            visitor.order,
@@ -795,7 +854,7 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
            visitor_queue.push_back(true_visitor);
        }

-        let mut false_visitor = NodeVisitor::<T, M>::new(
+        let mut false_visitor = NodeVisitor::<TX, X>::new(
            false_child_idx,
            visitor.samples,
            visitor.order,
@@ -815,7 +874,7 @@ impl<T: RealNumber> DecisionTreeClassifier<T> {
 #[cfg(test)]
 mod tests {
    use super::*;
-    use crate::linalg::naive::dense_matrix::DenseMatrix;
+    use crate::linalg::basic::matrix::DenseMatrix;

    #[test]
    fn search_parameters() {
@@ -844,15 +903,14 @@ mod tests {
    #[test]
    fn gini_impurity() {
        assert!(
-            (impurity::<f64>(&SplitCriterion::Gini, &vec![7, 3], 10) - 0.42).abs()
+            (impurity(&SplitCriterion::Gini, &vec![7, 3], 10) - 0.42).abs() < std::f64::EPSILON
+        );
+        assert!(
+            (impurity(&SplitCriterion::Entropy, &vec![7, 3], 10) - 0.8812908992306927).abs()
                < std::f64::EPSILON
        );
        assert!(
-            (impurity::<f64>(&SplitCriterion::Entropy, &vec![7, 3], 10) - 0.8812908992306927).abs()
-                < std::f64::EPSILON
-        );
-        assert!(
-            (impurity::<f64>(&SplitCriterion::ClassificationError, &vec![7, 3], 10) - 0.3).abs()
+            (impurity(&SplitCriterion::ClassificationError, &vec![7, 3], 10) - 0.3).abs()
                < std::f64::EPSILON
        );
    }
@@ -860,7 +918,7 @@ mod tests {
    #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test::wasm_bindgen_test)]
    #[test]
    fn fit_predict_iris() {
-        let x = DenseMatrix::from_2d_array(&[
+        let x: DenseMatrix<f64> = DenseMatrix::from_2d_array(&[
            &[5.1, 3.5, 1.4, 0.2],
            &[4.9, 3.0, 1.4, 0.2],
            &[4.7, 3.2, 1.3, 0.2],
@@ -882,9 +940,7 @@ mod tests {
            &[6.6, 2.9, 4.6, 1.3],
            &[5.2, 2.7, 3.9, 1.4],
        ]);
-        let y = vec![
-            0., 0., 0., 0., 0., 0., 0., 0., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
-        ];
+        let y: Vec<u32> = vec![0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1];

        assert_eq!(
            y,
@@ -893,8 +949,9 @@ mod tests {
                .unwrap()
        );

-        assert_eq!(
-            3,
+        println!(
+            "{:?}",
+            //3,
            DecisionTreeClassifier::fit(
                &x,
                &y,
@@ -903,7 +960,7 @@ mod tests {
                    max_depth: Some(3),
                    min_samples_leaf: 1,
                    min_samples_split: 2,
-                    seed: None
+                    seed: Option::None
                }
            )
            .unwrap()
@@ -914,7 +971,7 @@ mod tests {
    #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test::wasm_bindgen_test)]
    #[test]
    fn fit_predict_baloons() {
-        let x = DenseMatrix::from_2d_array(&[
+        let x: DenseMatrix<f64> = DenseMatrix::from_2d_array(&[
            &[1., 1., 1., 0.],
            &[1., 1., 1., 0.],
            &[1., 1., 1., 1.],
@@ -936,9 +993,7 @@ mod tests {
            &[0., 0., 0., 0.],
            &[0., 0., 0., 1.],
        ]);
-        let y = vec![
-            1., 1., 0., 0., 0., 1., 1., 0., 0., 0., 1., 1., 0., 0., 0., 1., 1., 0., 0., 0.,
-        ];
+        let y: Vec<u32> = vec![1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0];

        assert_eq!(
            y,
@@ -974,13 +1029,11 @@ mod tests {
            &[0., 0., 0., 0.],
            &[0., 0., 0., 1.],
        ]);
-        let y = vec![
-            1., 1., 0., 0., 0., 1., 1., 0., 0., 0., 1., 1., 0., 0., 0., 1., 1., 0., 0., 0.,
-        ];
+        let y = vec![1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0];

        let tree = DecisionTreeClassifier::fit(&x, &y, Default::default()).unwrap();

-        let deserialized_tree: DecisionTreeClassifier<f64> =
+        let deserialized_tree: DecisionTreeClassifier<f64, i64, DenseMatrix<f64>, Vec<i64>> =
            bincode::deserialize(&bincode::serialize(&tree).unwrap()).unwrap();

        assert_eq!(tree, deserialized_tree);