From 2605bf38168b75f87d125091356af9673ad27fb1 Mon Sep 17 00:00:00 2001
From: meliurwen <meliurwen@gmail.com>
Date: Wed, 11 May 2022 22:24:17 +0200
Subject: [PATCH 1/3] Implemented part of matrices comparison in chi square

---
 Cargo.toml                                    |   3 +-
 src/parameter_learning.rs                     |  17 +++
 src/structure_learning.rs                     |   2 +
 .../constraint_based_algorithm.rs             |   5 +
 src/structure_learning/hypothesis_test.rs     | 101 ++++++++++++++++++
 tests/structure_learning.rs                   |  23 ++++
 6 files changed, 149 insertions(+), 2 deletions(-)
 create mode 100644 src/structure_learning/constraint_based_algorithm.rs
 create mode 100644 src/structure_learning/hypothesis_test.rs
diff --git a/Cargo.toml b/Cargo.toml
index 4779b47..56d0452 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -6,8 +6,7 @@ edition = "2021"
 # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html
 
 [dependencies]
-
-ndarray = {version="*", features=["approx"]}
+ndarray = {version="*", features=["approx-0_5"]}
 thiserror = "*"
 rand = "*"
 bimap = "*"
diff --git a/src/parameter_learning.rs b/src/parameter_learning.rs
index 5270d9e..19c0e4c 100644
--- a/src/parameter_learning.rs
+++ b/src/parameter_learning.rs
@@ -153,3 +153,20 @@ impl ParameterLearning for BayesianApproach {
         return (CIM, M, T);
     }
 }
+
+
+pub struct Cache<P: ParameterLearning> {
+    parameter_learning: P,
+}
+
+impl<P: ParameterLearning> Cache<P> {
+    pub fn fit<T:network::Network>(
+        &mut self,
+        net: &T,
+        dataset: &tools::Dataset,
+        node: usize,
+        parent_set: Option<BTreeSet<usize>>,
+    ) -> (Array3<f64>, Array3<usize>, Array2<f64>) {
+        self.parameter_learning.fit(net, dataset, node, parent_set)
+    }
+}
diff --git a/src/structure_learning.rs b/src/structure_learning.rs
index 8ba91df..b7db7ed 100644
--- a/src/structure_learning.rs
+++ b/src/structure_learning.rs
@@ -1,5 +1,7 @@
 pub mod score_function;
 pub mod score_based_algorithm;
+pub mod constraint_based_algorithm;
+pub mod hypothesis_test;
 use crate::network;
 use crate::tools;
 
diff --git a/src/structure_learning/constraint_based_algorithm.rs b/src/structure_learning/constraint_based_algorithm.rs
new file mode 100644
index 0000000..0d8b655
--- /dev/null
+++ b/src/structure_learning/constraint_based_algorithm.rs
@@ -0,0 +1,5 @@
+
+//pub struct CTPC {
+//
+//}
+
diff --git a/src/structure_learning/hypothesis_test.rs b/src/structure_learning/hypothesis_test.rs
new file mode 100644
index 0000000..fc5c86f
--- /dev/null
+++ b/src/structure_learning/hypothesis_test.rs
@@ -0,0 +1,101 @@
+use ndarray::Array2;
+use ndarray::Array3;
+use ndarray::Axis;
+
+use crate::network;
+use crate::parameter_learning;
+use std::collections::BTreeSet;
+
+pub trait HypothesisTest {
+
+    fn call<T, P>(
+        &self,
+        net: &T,
+        child_node: usize,
+        parent_node: usize,
+        separation_set: &BTreeSet<usize>,
+        cache: parameter_learning::Cache<P>
+    ) -> bool
+    where
+        T: network::Network,
+        P: parameter_learning::ParameterLearning;
+
+}
+
+
+pub struct ChiSquare {
+    pub alpha: f64,
+}
+
+pub struct F {
+
+}
+
+impl ChiSquare {
+    pub fn compare_matrices(
+        &self, i: usize,
+        M1: &Array3<usize>,
+        j: usize,
+        M2: &Array3<usize>
+    ) -> bool {
+        // Bregoli, A., Scutari, M. and Stella, F., 2021.
+        // A constraint-based algorithm for the structural learning of
+        // continuous-time Bayesian networks.
+        // International Journal of Approximate Reasoning, 138, pp.105-122.
+        //
+        // M  = M            M  = M
+        //  1    xx'|s        2    xx'|y,s
+        let M1 = M1.index_axis(Axis(0), i).mapv(|x| x as f64);
+        let M2 = M2.index_axis(Axis(0), j).mapv(|x| x as f64);
+        //                   __________________
+        //                  /    ===
+        //                 /     \       M
+        //                /      /        xx'|s
+        //               /       ===
+        //              /    x'ϵVal /X \
+        //             /            \ i/                  1
+        //K =         /      ------------------       L = -
+        //           /           ===                      K
+        //          /            \       M
+        //         /             /        xx'|y,s
+        //        /              ===
+        //       /           x'ϵVal /X \
+        //   \  /                   \ i/
+        //    \/
+        let K = M1.sum_axis(Axis(1)) / M2.sum_axis(Axis(1));
+        let K = K.mapv(f64::sqrt);
+        // Reshape to column vector.
+        let K = {
+            let n = K.len();
+            K.into_shape((n, 1)).unwrap()
+        };
+        let L = 1.0 / &K;
+        //        =====
+        //         \       K . M  - L . M
+        //          \           2        1
+        //          /      ---------------
+        //         /           M  + M
+        //        =====         2    1
+        //     x'ϵVal /X \
+        //            \ i/
+        let X_2 = (( K * &M2 - L * &M1 ).mapv(|a| a.powi(2)) / (&M2 + &M1)).sum_axis(Axis(1));
+        println!("X_2: {:?}", X_2); 
+        true
+    }
+}
+
+impl HypothesisTest for ChiSquare {
+    fn call<T, P>(
+        &self,
+        net: &T,
+        child_node: usize,
+        parent_node: usize,
+        separation_set: &BTreeSet<usize>,
+        cache: parameter_learning::Cache<P>
+    ) -> bool
+    where
+        T: network::Network,
+        P: parameter_learning::ParameterLearning {
+        todo!()
+    }
+}
diff --git a/tests/structure_learning.rs b/tests/structure_learning.rs
index c91f508..be9c8d5 100644
--- a/tests/structure_learning.rs
+++ b/tests/structure_learning.rs
@@ -7,6 +7,7 @@ use reCTBN::network::Network;
 use reCTBN::params;
 use reCTBN::structure_learning::score_function::*;
 use reCTBN::structure_learning::{score_based_algorithm::*, StructureLearningAlgorithm};
+use reCTBN::structure_learning::hypothesis_test::*;
 use reCTBN::tools::*;
 use std::collections::BTreeSet;
 
@@ -315,3 +316,25 @@ pub fn learn_mixed_discrete_net_3_nodes_hill_climbing_bic_1_parent_constraint()
     let hl = HillClimbing::new(bic, Some(1));
     learn_mixed_discrete_net_3_nodes_1_parent_constraint(hl);
 }
+
+#[test]
+pub fn chi_square_compare_matrices () {
+    let i: usize = 1;
+    let M1 = arr3(&[
+       [[ 1,  2,  3],
+        [ 4,  5,  6]],
+       [[ 22,  12,  90],
+        [3, 20, 40]],
+        [[ 1,  2,  3],
+        [ 4,  5,  6]],
+       [[ 7,  8,  9],
+        [10, 11, 12]]
+    ]);
+    let j: usize = 1;
+    let M2 = arr3(&[[[ 1,  2,  3],     // -- 2 rows  \_
+        [ 4,  5,  6]],
+       [[ 7,  8,  9],
+        [10, 11, 12]]]);
+    let chi_sq = ChiSquare {alpha: 0.5};
+    chi_sq.compare_matrices( i, &M1, j, &M2);
+}

From 4b35ae63101394a47afbd22e397830f6043b7027 Mon Sep 17 00:00:00 2001
From: meliurwen <meliurwen@gmail.com>
Date: Thu, 19 May 2022 13:47:39 +0200
Subject: [PATCH 2/3] Implemented matrices comparison function in chi square

---
 Cargo.toml                                |  2 +-
 src/structure_learning/hypothesis_test.rs | 28 ++++++--
 tests/structure_learning.rs               | 80 ++++++++++++++++++-----
 3 files changed, 88 insertions(+), 22 deletions(-)

diff --git a/Cargo.toml b/Cargo.toml
index 56d0452..553e294 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -6,7 +6,7 @@ edition = "2021"
 # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html
 
 [dependencies]
-ndarray = {version="*", features=["approx-0_5"]}
+ndarray = {version="*", features=["approx"]}
 thiserror = "*"
 rand = "*"
 bimap = "*"
diff --git a/src/structure_learning/hypothesis_test.rs b/src/structure_learning/hypothesis_test.rs
index fc5c86f..6e06721 100644
--- a/src/structure_learning/hypothesis_test.rs
+++ b/src/structure_learning/hypothesis_test.rs
@@ -1,6 +1,7 @@
 use ndarray::Array2;
 use ndarray::Array3;
 use ndarray::Axis;
+use statrs::distribution::{ChiSquared, ContinuousCDF};
 
 use crate::network;
 use crate::parameter_learning;
@@ -24,7 +25,7 @@ pub trait HypothesisTest {
 
 
 pub struct ChiSquare {
-    pub alpha: f64,
+    alpha: f64,
 }
 
 pub struct F {
@@ -32,6 +33,11 @@ pub struct F {
 }
 
 impl ChiSquare {
+    pub fn new( alpha: f64) -> ChiSquare {
+        ChiSquare {
+            alpha
+        }
+    }
     pub fn compare_matrices(
         &self, i: usize,
         M1: &Array3<usize>,
@@ -42,6 +48,7 @@ impl ChiSquare {
         // A constraint-based algorithm for the structural learning of
         // continuous-time Bayesian networks.
         // International Journal of Approximate Reasoning, 138, pp.105-122.
+        // Also: https://www.itl.nist.gov/div898/software/dataplot/refman1/auxillar/chi2samp.htm
         //
         // M  = M            M  = M
         //  1    xx'|s        2    xx'|y,s
@@ -70,17 +77,26 @@ impl ChiSquare {
             K.into_shape((n, 1)).unwrap()
         };
         let L = 1.0 / &K;
-        //        =====
-        //         \       K . M  - L . M
+        //        =====                   2
+        //         \      (K . M  - L . M)
         //          \           2        1
         //          /      ---------------
         //         /           M  + M
         //        =====         2    1
         //     x'ϵVal /X \
         //            \ i/
-        let X_2 = (( K * &M2 - L * &M1 ).mapv(|a| a.powi(2)) / (&M2 + &M1)).sum_axis(Axis(1));
-        println!("X_2: {:?}", X_2); 
-        true
+        let mut X_2 = ( &K * &M2 - &L * &M1 ).mapv(|a| a.powi(2)) / (&M2 + &M1);
+        println!("M1: {:?}", M1);
+        println!("M2: {:?}", M2);
+        println!("L*M1: {:?}", (L * &M1));
+        println!("K*M2: {:?}", (K * &M2));
+        println!("X_2: {:?}", X_2);
+        X_2.diag_mut().fill(0.0);
+        let X_2 = X_2.sum_axis(Axis(1));
+        let n = ChiSquared::new((X_2.dim() - 1) as f64).unwrap();
+        println!("CHI^2: {:?}", n);
+        println!("CHI^2 CDF: {:?}", X_2.mapv(|x| n.cdf(x)));
+        X_2.into_iter().all(|x| n.cdf(x) < (1.0 - self.alpha))
     }
 }
 
diff --git a/tests/structure_learning.rs b/tests/structure_learning.rs
index be9c8d5..2c9645b 100644
--- a/tests/structure_learning.rs
+++ b/tests/structure_learning.rs
@@ -321,20 +321,70 @@ pub fn learn_mixed_discrete_net_3_nodes_hill_climbing_bic_1_parent_constraint()
 pub fn chi_square_compare_matrices () {
     let i: usize = 1;
     let M1 = arr3(&[
-       [[ 1,  2,  3],
-        [ 4,  5,  6]],
-       [[ 22,  12,  90],
-        [3, 20, 40]],
-        [[ 1,  2,  3],
-        [ 4,  5,  6]],
-       [[ 7,  8,  9],
-        [10, 11, 12]]
+       [[ 0,  2,  3],
+        [ 4,  0,  6],
+        [ 7,  8,  0]],
+       [[0, 12,  90],
+        [ 3, 0,  40],
+        [ 6, 40,  0]],
+       [[ 0,  2,  3],
+        [ 4,  0,  6],
+        [ 44, 66, 0]]
     ]);
-    let j: usize = 1;
-    let M2 = arr3(&[[[ 1,  2,  3],     // -- 2 rows  \_
-        [ 4,  5,  6]],
-       [[ 7,  8,  9],
-        [10, 11, 12]]]);
-    let chi_sq = ChiSquare {alpha: 0.5};
-    chi_sq.compare_matrices( i, &M1, j, &M2);
+    let j: usize = 0;
+    let M2 = arr3(&[
+       [[ 0,  200,  300],
+        [ 400,  0,  600],
+        [  700, 800,  0]]
+    ]);
+    let chi_sq = ChiSquare::new(0.1);
+    assert!(!chi_sq.compare_matrices( i, &M1, j, &M2));
+}
+
+#[test]
+pub fn chi_square_compare_matrices_2 () {
+    let i: usize = 1;
+    let M1 = arr3(&[
+       [[ 0,  2,  3],
+        [ 4,  0,  6],
+        [ 7,  8,  0]],
+       [[0, 20,  30],
+        [ 40, 0,  60],
+        [ 70, 80,  0]],
+       [[ 0,  2,  3],
+        [ 4,  0,  6],
+        [ 44, 66, 0]]
+    ]);
+    let j: usize = 0;
+    let M2 = arr3(&[
+       [[ 0,  200,  300],
+        [ 400,  0,  600],
+        [  700, 800,  0]]
+    ]);
+    let chi_sq = ChiSquare::new(0.1);
+    assert!(chi_sq.compare_matrices( i, &M1, j, &M2));
+}
+
+#[test]
+pub fn chi_square_compare_matrices_3 () {
+    let i: usize = 1;
+    let M1 = arr3(&[
+       [[ 0,  2,  3],
+        [ 4,  0,  6],
+        [ 7,  8,  0]],
+       [[0, 21,  31],
+        [ 41, 0,  59],
+        [ 71, 79,  0]],
+       [[ 0,  2,  3],
+        [ 4,  0,  6],
+        [ 44, 66, 0]]
+    ]);
+    let j: usize = 0;
+    let M2 = arr3(&[
+       [[ 0,  200,  300],
+        [ 400,  0,  600],
+        [  700, 800,  0]]
+    ]);
+    let chi_sq = ChiSquare::new(0.1);
+    assert!(chi_sq.compare_matrices( i, &M1, j, &M2));
 }

From 68ada89c0419af88eeca13541664b7799f76141f Mon Sep 17 00:00:00 2001
From: meliurwen <meliurwen@gmail.com>
Date: Mon, 13 Jun 2022 13:27:42 +0200
Subject: [PATCH 3/3] Expanded Hypothesis test

---
 src/parameter_learning.rs                 |  4 ++--
 src/structure_learning/hypothesis_test.rs | 26 +++++++++++++++++++----
 2 files changed, 24 insertions(+), 6 deletions(-)

diff --git a/src/parameter_learning.rs b/src/parameter_learning.rs
index 19c0e4c..6fff9d1 100644
--- a/src/parameter_learning.rs
+++ b/src/parameter_learning.rs
@@ -157,16 +157,16 @@ impl ParameterLearning for BayesianApproach {
 
 pub struct Cache<P: ParameterLearning> {
     parameter_learning: P,
+    dataset: tools::Dataset,
 }
 
 impl<P: ParameterLearning> Cache<P> {
     pub fn fit<T:network::Network>(
         &mut self,
         net: &T,
-        dataset: &tools::Dataset,
         node: usize,
         parent_set: Option<BTreeSet<usize>>,
     ) -> (Array3<f64>, Array3<usize>, Array2<f64>) {
-        self.parameter_learning.fit(net, dataset, node, parent_set)
+        self.parameter_learning.fit(net, &self.dataset, node, parent_set)
     }
 }
diff --git a/src/structure_learning/hypothesis_test.rs b/src/structure_learning/hypothesis_test.rs
index 6e06721..86500e5 100644
--- a/src/structure_learning/hypothesis_test.rs
+++ b/src/structure_learning/hypothesis_test.rs
@@ -5,6 +5,7 @@ use statrs::distribution::{ChiSquared, ContinuousCDF};
 
 use crate::network;
 use crate::parameter_learning;
+use crate::params::ParamsTrait;
 use std::collections::BTreeSet;
 
 pub trait HypothesisTest {
@@ -15,7 +16,7 @@ pub trait HypothesisTest {
         child_node: usize,
         parent_node: usize,
         separation_set: &BTreeSet<usize>,
-        cache: parameter_learning::Cache<P>
+        cache: &mut parameter_learning::Cache<P>
     ) -> bool
     where
         T: network::Network,
@@ -39,7 +40,8 @@ impl ChiSquare {
         }
     }
     pub fn compare_matrices(
-        &self, i: usize,
+        &self,
+        i: usize,
         M1: &Array3<usize>,
         j: usize,
         M2: &Array3<usize>
@@ -107,11 +109,27 @@ impl HypothesisTest for ChiSquare {
         child_node: usize,
         parent_node: usize,
         separation_set: &BTreeSet<usize>,
-        cache: parameter_learning::Cache<P>
+        cache: &mut parameter_learning::Cache<P>
     ) -> bool
     where
         T: network::Network,
         P: parameter_learning::ParameterLearning {
-        todo!()
+        // Fetch the learned parameters from the cache (nominally an n x n CIM).
+        // `fit` returns the tuple below; only M is kept here.
+        //  (CIM, M, T)
+        let ( _, M_small, _) = cache.fit(net, child_node, Some(separation_set.clone()));
+        // Repeat the fit with parent_node added to the separation set.
+        let mut extended_separation_set = separation_set.clone();
+        extended_separation_set.insert(parent_node);
+        let ( _, M_big, _) = cache.fit(net, child_node, Some(extended_separation_set.clone()));
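+        // For each index of M_big, derive the index of M_small by removing parent_node's component (TODO confirm the parent-configuration index encoding).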
+        let partial_cardinality_product:usize = extended_separation_set.iter().take_while(|x| **x != parent_node).map(|x| net.get_node(*x).get_reserved_space_as_parent()).product();
+        for idx_M_big in 0..M_big.shape()[0] {
+            let idx_M_small: usize = idx_M_big%partial_cardinality_product + (idx_M_big/(partial_cardinality_product*net.get_node(parent_node).get_reserved_space_as_parent()))*partial_cardinality_product;
+            if ! self.compare_matrices(idx_M_small, &M_small, idx_M_big, &M_big) {
+                return false;
+            }
+        }
+        return true;
     }
 }