Cstandardlib
diff --git a/‎source/source_estate/elecstate_print.cpp‎
Lines changed: 1 addition & 0 deletions b/‎source/source_estate/elecstate_print.cpp‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎source/source_hsolver/diago_lobpcg.cpp‎
Lines changed: 1089 additions & 0 deletions b/‎source/source_hsolver/diago_lobpcg.cpp‎
Lines changed: 1089 additions & 0 deletions
diff --git a/‎source/source_hsolver/diago_lobpcg.h‎
Lines changed: 490 additions & 0 deletions b/‎source/source_hsolver/diago_lobpcg.h‎
Lines changed: 490 additions & 0 deletions
diff --git a/‎source/source_hsolver/hsolver_pw.cpp‎
Lines changed: 55 additions & 1 deletion b/‎source/source_hsolver/hsolver_pw.cpp‎
Lines changed: 55 additions & 1 deletion
diff --git a/‎source/source_hsolver/test/CMakeLists.txt‎
Lines changed: 2 additions & 2 deletions b/‎source/source_hsolver/test/CMakeLists.txt‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎source/source_hsolver/test/diago_lobpcg_simple_test.cpp‎
Lines changed: 189 additions & 0 deletions b/‎source/source_hsolver/test/diago_lobpcg_simple_test.cpp‎
Lines changed: 189 additions & 0 deletions
@@ -55,6 +55,7 @@ void print_scf_iterinfo(const std::string& ks_solver,
            {"elpa", "EL"},
            {"dav", "DA"},
            {"dav_subspace", "DS"},
+           {"lobpcg", "LB"},
            {"scalapack_gvx", "GV"},
            {"cusolver", "CU"},
            {"bpcg", "BP"},
 
@@ -6,11 +6,14 @@
 #include "source_estate/elecstate_pw.h"
 #include "source_hamilt/hamilt.h"
 #include "source_hsolver/diag_comm_info.h"
+
 #include "source_hsolver/diago_bpcg.h"
 #include "source_hsolver/diago_cg.h"
 #include "source_hsolver/diago_dav_subspace.h"
 #include "source_hsolver/diago_david.h"
+#include "source_hsolver/diago_lobpcg.h"
 #include "source_hsolver/diago_iter_assist.h"
+
 #include "source_io/module_parameter/parameter.h"
 #include "source_psi/psi.h"
 #include "source_estate/elecstate_tools.h"
@@ -82,7 +85,7 @@ void HSolverPW<T, Device>::solve(hamilt::Hamilt<T, Device>* pHamilt,
     this->nproc_in_pool = nproc_in_pool_in;
 
     // report if the specified diagonalization method is not supported
-    const std::initializer_list<std::string> _methods = {"cg", "dav", "dav_subspace", "bpcg"};
+    const std::initializer_list<std::string> _methods = {"cg", "dav", "dav_subspace", "bpcg", "lobpcg"};
     if (std::find(std::begin(_methods), std::end(_methods), this->method) == std::end(_methods))
     {
         ModuleBase::WARNING_QUIT("HSolverPW::solve", "This type of eigensolver is not supported!");
@@ -393,6 +396,11 @@ void HSolverPW<T, Device>::hamiltSolvePsiK(hamilt::Hamilt<T, Device>* hm,
             hm->sPsi(psi_in, spsi_out, ld_psi, ld_psi, nvec);
         };
 
+        double tolerance = this->diag_thr;
+        int max_iter = this->diag_iter_max;
+        std::cout << "DS default tolerance: " << tolerance << ", max_iter: " << max_iter << std::endl;
+
+
         Diago_DavSubspace<T, Device> dav_subspace(pre_condition,
                                                   psi.get_nbands(),
                                                   psi.get_k_first() ? psi.get_current_ngk()
@@ -467,6 +475,52 @@ void HSolverPW<T, Device>::hamiltSolvePsiK(hamilt::Hamilt<T, Device>* hm,
                                                                                ntry_max,
                                                                                notconv_max));
     }
+    else if (this->method == "lobpcg"){
+        // hpsi_func (X, HX, ld, nvec) -> HX = H(X), X and HX blockvectors of size ld x nvec
+        auto hpsi_func = [hm, cur_nbasis](T* psi_in, T* hpsi_out, const int ld_psi, const int nvec) {
+
+            // Convert "pointer data structure" to a psi::Psi object
+            auto psi_iter_wrapper = psi::Psi<T, Device>(psi_in, 1, nvec, ld_psi, cur_nbasis);
+
+            psi::Range bands_range(true, 0, 0, nvec - 1);
+
+            using hpsi_info = typename hamilt::Operator<T, Device>::hpsi_info;
+            hpsi_info info(&psi_iter_wrapper, bands_range, hpsi_out);
+            hm->ops->hPsi(info);
+        };
+
+        auto spsi_func = [hm](T* psi_in, T* spsi_out, const int ld_psi, const int nvec) {
+            hm->sPsi(psi_in, spsi_out, ld_psi, ld_psi, nvec);
+        };
+        const int ndim = psi.get_current_ngk();         /// dimension of matrix
+        const int nband = psi.get_nbands();            /// number of eigenpairs sought
+        const int nmax = nband + 20;
+        const int ld_psi = psi.get_nbasis();           /// leading dimension of psi
+
+        bool gen_eig = false;
+
+        double tolerance = this->diag_thr;
+        int max_iter = this->diag_iter_max;
+        // print default tolerance and max_iter for LOBPCG
+        std::cout << "LOBPCG default tolerance: " << tolerance << ", max_iter: " << max_iter << std::endl;
+        max_iter = 1000; // LOBPCG is not stable enough yet, so max_iter is hard-coded to 1000 here, overriding diag_iter_max. TODO: further test and optimize LOBPCG in the future.
+        if (tolerance > 1e-6)tolerance = 1e-6;
+        std::cout << "LOBPCG current tolerance: " << tolerance << ", max_iter: " << max_iter << std::endl;
+
+        DiagoLOBPCG<T, Device> lobpcg(pre_condition.data(), nband, ndim, nmax);
+        bool ok = lobpcg.diag(hpsi_func, spsi_func, gen_eig,
+            eigenvalue, psi.get_pointer(), ld_psi, tolerance, max_iter);
+    }
+    // now print lowest 5 eigenvalues for debugging
+    if (this->rank_in_pool == 0)
+    {
+        std::cout << "Lowest 5 eigenvalues for current k-point: ";
+        for (int i = 0; i < std::min(5, psi.get_nbands()); i++)
+        {
+            std::cout << eigenvalue[i] << " ";
+        }
+        std::cout << std::endl;
+    }
     ModuleBase::timer::tick("HSolverPW", "solve_psik");
     return;
 }
 
@@ -92,14 +92,14 @@ if (ENABLE_MPI)
   AddTest(
     TARGET MODULE_HSOLVER_pw
     LIBS parameter  ${math_libs} psi device base container
-    SOURCES test_hsolver_pw.cpp ../hsolver_pw.cpp ../hsolver_lcaopw.cpp ../diago_bpcg.cpp ../diago_dav_subspace.cpp ../diag_const_nums.cpp ../diago_iter_assist.cpp ../para_linear_transform.cpp
+    SOURCES test_hsolver_pw.cpp ../hsolver_pw.cpp ../hsolver_lcaopw.cpp ../diago_bpcg.cpp ../diago_dav_subspace.cpp ../diag_const_nums.cpp ../diago_iter_assist.cpp ../para_linear_transform.cpp ../diago_lobpcg.cpp
     ../../source_estate/elecstate_tools.cpp ../../source_estate/occupy.cpp ../../source_base/module_fft/fft_bundle.cpp ../../source_base/module_fft/fft_cpu.cpp
   )
 
   AddTest(
     TARGET MODULE_HSOLVER_sdft
     LIBS parameter  ${math_libs} psi device base container
-    SOURCES test_hsolver_sdft.cpp ../hsolver_pw_sdft.cpp ../hsolver_pw.cpp ../diago_bpcg.cpp ../diago_dav_subspace.cpp ../diag_const_nums.cpp ../diago_iter_assist.cpp ../para_linear_transform.cpp
+    SOURCES test_hsolver_sdft.cpp ../hsolver_pw_sdft.cpp ../hsolver_pw.cpp ../diago_bpcg.cpp ../diago_dav_subspace.cpp ../diag_const_nums.cpp ../diago_iter_assist.cpp ../para_linear_transform.cpp ../diago_lobpcg.cpp
                 ../../source_estate/elecstate_tools.cpp ../../source_estate/occupy.cpp ../../source_base/module_fft/fft_bundle.cpp ../../source_base/module_fft/fft_cpu.cpp
     )
 
 
@@ -0,0 +1,189 @@
+#include <gtest/gtest.h>
+#include <complex>
+#include <vector>
+#include <cmath>
+#include <iostream>
+#include <random>
+#include "source_hsolver/diago_lobpcg.h"
+
+// Define complex double type
+using Complex = std::complex<double>;
+
+// Declare LAPACK zheev helper
+extern "C" {
+    void zheev_(const char* jobz, const char* uplo, const int* n, Complex* a, const int* lda, double* w, Complex* work, const int* lwork, double* rwork, int* info);
+    void zgemm_(const char* transa, const char* transb, const int* m, const int* n, const int* k,
+                const Complex* alpha, const Complex* a, const int* lda,
+                const Complex* b, const int* ldb,
+                const Complex* beta, Complex* c, const int* ldc);
+}
+
+/// Test fixture that builds a dense Hermitian matrix and checks the lowest
+/// eigenvalues produced by hsolver::DiagoLOBPCG against LAPACK's zheev.
+class DiagoLobpcgTest : public testing::Test {
+protected:
+    /// Dense n x n test matrix in column-major order: A(i, j) is matrix[j * n + i].
+    std::vector<Complex> matrix;
+
+    /// Resize `matrix` to n x n and fill it according to `type`.
+    /// type 0: deterministic; diagonal 1..n, off-diagonal 0.1 / (|i - j| + 1)
+    /// type 1: random diagonally dominant complex Hermitian (fixed seed)
+    /// Any other type only resizes the storage.
+    void GenerateMatrix(int n, int type) {
+        matrix.resize(n * n);
+        if (type == 0) {
+            for (int j = 0; j < n; ++j) {
+                for (int i = 0; i < n; ++i) {
+                    if (i == j) {
+                        matrix[j * n + i] = static_cast<double>(i + 1); // Diagonal 1..n
+                    } else {
+                        // Off-diagonal decays with the distance from the diagonal
+                        const double val = 1.0 / (std::abs(i - j) + 1.0);
+                        matrix[j * n + i] = val * 0.1;
+                    }
+                }
+            }
+        } else if (type == 1) {
+            // Fixed seed so that every run sees the same matrix
+            std::mt19937 gen(42);
+            // Diagonal elements: spaced out to ensure good conditioning for basic LOBPCG
+            // Off-diagonal: small random values
+            std::uniform_real_distribution<> val_dist(-0.5, 0.5);
+
+            for (int j = 0; j < n; ++j) {
+                // Diagonal (real): j+1 plus small noise keeps eigenvalues roughly 1.0 apart
+                matrix[j * n + j] = static_cast<double>(j + 1) + val_dist(gen) * 0.5;
+
+                // Off-diagonal (complex)
+                for (int i = j + 1; i < n; ++i) {
+                    // Draw real and imaginary parts in separate statements: the order in
+                    // which constructor arguments are evaluated is unspecified, so drawing
+                    // both inside Complex(...) could give different matrices per compiler.
+                    const double re = val_dist(gen) * 0.05;
+                    const double im = val_dist(gen) * 0.05;
+                    const Complex val(re, im);
+                    // A(i, j) at matrix[j*n + i]
+                    matrix[j * n + i] = val;
+                    // A(j, i) at matrix[i*n + j]
+                    matrix[i * n + j] = std::conj(val);
+                }
+            }
+        }
+    }
+
+    /// Compare the lowest `nband` eigenvalues of `matrix` computed by LOBPCG with
+    /// the reference values from LAPACK zheev.
+    /// @param n          dimension of the matrix stored in `matrix`
+    /// @param nband      number of lowest eigenvalues to compare
+    /// @param check_tol  absolute tolerance for the eigenvalue comparison
+    /// @param cg_tol     convergence tolerance handed to DiagoLOBPCG::diag
+    void VerifyLobpcg(int n, int nband, double check_tol = 1e-3, double cg_tol = 1e-5) {
+        // Guard the buffer sizes and index ranges used below.
+        ASSERT_GT(n, 0) << "matrix dimension must be positive";
+        ASSERT_GT(nband, 0) << "number of bands must be positive";
+        ASSERT_LE(nband, n) << "cannot request more eigenvalues than the matrix dimension";
+        ASSERT_EQ(matrix.size(), static_cast<std::size_t>(n) * static_cast<std::size_t>(n))
+            << "GenerateMatrix must be called with the same n before VerifyLobpcg";
+
+        // ---------------------------------------------------------
+        // 1. Solve with LAPACK (Gold Standard)
+        // ---------------------------------------------------------
+        std::vector<Complex> mat_lapack = matrix; // zheev overwrites its input, so work on a copy
+        std::vector<double> ev_lapack(n);
+
+        Complex work_query;
+        std::vector<double> rwork(3 * n - 2);
+        int lwork_query = -1; // lwork = -1 requests a workspace-size query
+        int info = 0;
+        int n_val = n;
+
+        char jobz = 'N'; // eigenvalues only
+        char uplo = 'U';
+
+        // Query workspace
+        zheev_(&jobz, &uplo, &n_val, mat_lapack.data(), &n_val, ev_lapack.data(), &work_query, &lwork_query, rwork.data(), &info);
+        ASSERT_EQ(info, 0) << "LAPACK zheev workspace query failed with info=" << info;
+
+        int lwork = static_cast<int>(work_query.real()) + 1;
+        std::vector<Complex> work(lwork);
+
+        // Compute
+        zheev_(&jobz, &uplo, &n_val, mat_lapack.data(), &n_val, ev_lapack.data(), work.data(), &lwork, rwork.data(), &info);
+
+        ASSERT_EQ(info, 0) << "LAPACK zheev computation failed with info=" << info;
+
+        // ---------------------------------------------------------
+        // 2. Solve with LOBPCG
+        // ---------------------------------------------------------
+        std::vector<double> precondition(n, 1.0); // Identity Preconditioner
+
+        int n_max = nband + 5;
+        hsolver::DiagoLOBPCG<Complex> lobpcg(precondition.data(), nband, n, n_max);
+
+        std::vector<double> ev_lobpcg(nband);
+        std::vector<Complex> psi(n * nband);
+
+        // Initial guess: real values in [0, 1]
+        for(auto &val : psi) val = static_cast<double>(rand()) / RAND_MAX;
+
+        // out = A * in for a block of nvec column vectors with leading dimension ld
+        auto hpsi_func = [&](Complex* in, Complex* out, const int ld, const int nvec) {
+            char transa = 'N';
+            char transb = 'N';
+            int m_ = n;
+            int n_ = nvec;
+            int k_ = n;
+            Complex alpha = 1.0;
+            Complex beta = 0.0;
+            int lda = n;
+
+            zgemm_(&transa, &transb, &m_, &n_, &k_,
+                   &alpha, matrix.data(), &lda,
+                   in, &ld,
+                   &beta, out, &ld);
+        };
+
+        int max_iter = 2000;
+        bool converged = lobpcg.diag(
+            hpsi_func,
+            nullptr,
+            false,
+            ev_lobpcg.data(),
+            psi.data(),
+            n,
+            cg_tol,
+            max_iter
+        );
+
+        EXPECT_TRUE(converged) << "LOBPCG did not converge in " << max_iter << " iterations";
+
+        // ---------------------------------------------------------
+        // 3. Compare Results
+        // ---------------------------------------------------------
+        for(int i = 0; i < nband; ++i) {
+            EXPECT_NEAR(ev_lobpcg[i], ev_lapack[i], check_tol)
+                << "Mismatch at eigenvalue index " << i
+                << " LAPACK: " << ev_lapack[i] << " LOBPCG: " << ev_lobpcg[i];
+        }
+        // Print the side-by-side values even when the test passes, for debugging
+        std::cout << "Eigenvalues comparison (LOBPCG vs LAPACK):" << std::endl;
+        for(int i=0; i<nband; ++i) {
+            std::cout << "Index " << i << ": " << ev_lobpcg[i] << " vs " << ev_lapack[i] << std::endl;
+        }
+    }
+};
+
+// Deterministic 100 x 100 matrix, lowest 10 eigenvalues, default tolerances.
+TEST_F(DiagoLobpcgTest, CompareWithLapack) {
+    constexpr int kDim = 100;
+    constexpr int kBands = 10;
+
+    GenerateMatrix(kDim, 0);
+    VerifyLobpcg(kDim, kBands);
+}
+
+// Deterministic 200 x 200 matrix, lowest 20 eigenvalues, default tolerances.
+TEST_F(DiagoLobpcgTest, LargeScale) {
+    constexpr int kDim = 200;
+    constexpr int kBands = 20;
+
+    GenerateMatrix(kDim, 0);
+    VerifyLobpcg(kDim, kBands);
+}
+
+// Seeded random Hermitian 50 x 50 matrix, lowest 10 eigenvalues, with looser
+// comparison (0.1) and solver (1e-2) tolerances than the deterministic cases.
+TEST_F(DiagoLobpcgTest, RandomMatrix) {
+    constexpr int kDim = 50;
+    constexpr int kBands = 10;
+    constexpr double kCheckTol = 0.1;
+    constexpr double kSolverTol = 1e-2;
+
+    GenerateMatrix(kDim, 1);
+    VerifyLobpcg(kDim, kBands, kCheckTol, kSolverTol);
+}