Minor fixes in sliding intervals and documentation

lorenzotomada · lorenzotomada · commit b8cc36e8dd2b · 2025-06-26T10:28:29.000+02:00
diff --git a/scripts/mpi_running.py b/scripts/mpi_running.py
@@ -9,7 +9,7 @@ def parallel_eig(d, off_d, nprocs):
 
     print("inside parallel_eig")
     comm = MPI.COMM_SELF.Spawn(
-        sys.executable, args=["./parallel_tridiag_eigen.py"], maxprocs=nprocs
+        sys.executable, args=["src/pyclassify/parallel_tridiag_eigen.py"], maxprocs=nprocs
     )
     print("sending")
     comm.send(d, dest=0, tag=11)
diff --git a/src/pyclassify/cxx_utils.cpp b/src/pyclassify/cxx_utils.cpp
@@ -130,16 +130,11 @@ QR_algorithm(std::vector<double>  diag, std::vector<double>  off_diag, const dou
                     diag[0]=c*c*a_0+s*s*diag[1]-2*s*c*b_1;
                     diag[1]=c*c*diag[1]+s*s*a_0+2*s*c*b_1;
                     
-
                 }
-
             }
-
-      
         }
 
 
-
         unsigned j, k;
         for(unsigned int i=0; i<m; i++){
             c=Matrix_trigonometric[i][0];
@@ -170,8 +165,7 @@ QR_algorithm(std::vector<double>  diag, std::vector<double>  off_diag, const dou
                 Q[k]=tmp*c-Q[k+n]*s;
                 Q[k+n]=tmp*s+Q[k+n]*c;
             }
-    
-            
+         
         }
 
         iter++;
@@ -181,9 +175,7 @@ QR_algorithm(std::vector<double>  diag, std::vector<double>  off_diag, const dou
         }
     }
 
-    if(iter==max_iter){
-        std::cout<<"Converges failed"<<std::endl;
-    }
+    if(iter==max_iter) { std::cout<<"The QR method did not converge."<<std::endl; }
 
     std::vector<std::vector<double>> eig_vec(n,std::vector<double> (n, 0));
     //std::cout<<"Iteration: "<<iter<<std::endl;
@@ -210,7 +202,6 @@ Eigen_value_calculator(std::vector<double> diag, std::vector<double> off_diag, c
 
 
 
-
     std::vector<std::array<double, 2>> Matrix_trigonometric(n-1, {0, 0});
 
     unsigned int iter = 0;  
@@ -331,6 +322,12 @@ Eigen_value_calculator(std::vector<double> diag, std::vector<double> off_diag, c
 }
 
 
+/* Now we implement all the functions needed to solve the secular equation, following the ETH lecture notes listed in the references.
+ * This procedure involves defining the secular function, creating a nonlinear solver, and computing the zero in each interval.
+ * Notice that the outer zero is computed using bisection, because the procedure described in the notes only ensures
+ * convergence in the inner intervals. */
+
+
 double compute_sum(
     const std::vector<double>& v,
     const std::vector<double>& d,
@@ -352,6 +349,7 @@ double compute_sum(
     return rho * sum;
 }
 
+
 void compute_Psi(
     const unsigned int i,
     const std::vector<double>& v,
@@ -362,6 +360,7 @@ void compute_Psi(
     std::function<double(double)>& dPsi_1,
     std::function<double(double)>& dPsi_2
 ) {
+    /* Function to compute the psi_s that appear in the secular function. */
     Psi_1 = [&](double x) {
         return compute_sum(v, d, x, 0, i + 1, false, rho);
     };
@@ -376,6 +375,7 @@ void compute_Psi(
     };
 }
 
+
 std::pair<double, double> find_root(
     const unsigned int i,
     const bool left_center,
@@ -385,6 +385,8 @@ std::pair<double, double> find_root(
     double lam_0,
     const double tol = 1e-15,
     const unsigned int maxiter = 100) {
+    
+    /* Function to compute the inner root in the i-th interval */	
     std::vector<double> diag = d;
     double shift;
 
@@ -435,6 +437,7 @@ double bisection(
     double b,
     const double tol,
     const unsigned int max_iter) {
+
     unsigned int iter_count = 0;
 
     while ((b - a) / 2.0 > tol) {
@@ -462,16 +465,26 @@ double compute_outer_zero(
     const double rho,
     const double interval_end,
     const double tol = 1e-14,
-    const unsigned int max_iter = 1000){
+    const unsigned int max_iter = 100){
+
+    // This function calls bisection on a sliding interval. The interval is moved until f changes sign across it, which is the condition bisection needs.
 
-    const double threshold = 1e-11;
+    double threshold = 1e-11;
     double update = 0.0;
 
-    // Compute L2 norm of v
+    // Compute L2 norm of v and use it for the update
+    
     for (size_t i = 0; i < v.size(); ++i) {
         update += v[i] * v[i];
     }
-    update = std::sqrt(update);
+    // update = std::sqrt(update); // actually we use the square of the norm to avoid having to compute the square root
+    
+    // Another possibility for the update is the following (which is cheaper, but might cause trouble if the elements of d are too close to each other):
+
+    //if (rho>=0)
+    //    update = d[d.size() - 1] - d[d.size() - 2]; // cheaper than computing the norm each time
+    //else
+    //	update = d[1] - d[0]
 
     auto f = [&](double x) -> double {
         double sum = 0.0;
@@ -487,13 +500,30 @@ double compute_outer_zero(
     if (rho > 0.0) {
         a = interval_end + threshold;
         b = interval_end + 1.0;
-        while (f(a) * f(b) > 0.0) {
-            a = b;
-            b += update;
+	
+        // Ensure that f(a) has the correct sign
+        while (f(a)>0){
+            // we are on the wrong side of the zero!
+            b = a;
+            threshold = threshold*0.5;
+            a = interval_end + threshold;
         }
+            
+        while (f(a) * f(b) > 0.0) {
+                a = b;
+                b += update;
+            }
+
     } else if (rho < 0.0) {
         b = interval_end - threshold;
         a = interval_end - 1.0;
+	
+	// also in this case, ensure we are on the correct side of the zero
+        while (f(b)>0){
+            a = b;
+            threshold = threshold*0.5;
+            b = interval_end - threshold;
+        }
         while (f(a) * f(b) > 0.0) {
             b = a;
             a -= update;
@@ -787,4 +817,4 @@ PYBIND11_MODULE(cxx_utils, m) {
     m.def("Eigen_value_calculator", &Eigen_value_calculator, py::arg("diag"), py::arg("off_diag"), py::arg("tol")=1e-8, py::arg("max_iter")=5000);
     m.def("secular_solver_cxx", &secular_solver, py::arg("rho"), py::arg("d"), py::arg("v"), py::arg("indices"));
     m.def("deflate_eigenpairs_cxx", &deflateEigenpairs, py::arg("D"), py::arg("v"), py::arg("beta"), py::arg("tol_factor") = 1e-12);
-}
+}

Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@ def parallel_eig(d, off_d, nprocs):`
`9`	`9`
`10`	`10`	`print("inside parallel_eig")`
`11`	`11`	`comm = MPI.COMM_SELF.Spawn(`
`12`		`- sys.executable, args=["./parallel_tridiag_eigen.py"], maxprocs=nprocs`
	`12`	`+ sys.executable, args=["src/pyclassify/parallel_tridiag_eigen.py"], maxprocs=nprocs`
`13`	`13`	`)`
`14`	`14`	`print("sending")`
`15`	`15`	`comm.send(d, dest=0, tag=11)`