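Some minor optimizations: compute fxJxW once before the cell-block loop, allocate the cell-wise x/y buffers once outside the block loop, and reduce the default Lanczos maximum Krylov subspace size from 40 to 20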

Avirup Sircar · Avirup Sircar · commit ca415ace1529 · 2025-02-07T08:18:24.000-05:00
diff --git a/analysis/classicalEnrichmentComparison/PSP/KSDFTClassicalUniformQuad/TestKohnShamDft.cpp b/analysis/classicalEnrichmentComparison/PSP/KSDFTClassicalUniformQuad/TestKohnShamDft.cpp
@@ -407,6 +407,7 @@ void getVLoc(
           d_atomTolocPSPSplineMap.push_back(
               utils::Spline(radialValuesSTL,
                     potentialValuesLocSTL,
+                    false,
                     utils::Spline::spline_type::cspline,
                     false,
                     utils::Spline::bd_type::first_deriv,
diff --git a/analysis/classicalEnrichmentComparison/PSP/KSDFTOrthoEFEUniformQuad/TestKohnShamDft.cpp b/analysis/classicalEnrichmentComparison/PSP/KSDFTOrthoEFEUniformQuad/TestKohnShamDft.cpp
@@ -402,6 +402,7 @@ void getVLoc(
           d_atomTolocPSPSplineMap.push_back(
               utils::Spline(radialValuesSTL,
                     potentialValuesLocSTL,
+                    false,
                     utils::Spline::spline_type::cspline,
                     false,
                     utils::Spline::bd_type::first_deriv,
diff --git a/analysis/classicalEnrichmentComparison/PSP/KSDFTOrthoEFEUniformQuad/TestKohnShamDftDeltaRho.cpp b/analysis/classicalEnrichmentComparison/PSP/KSDFTOrthoEFEUniformQuad/TestKohnShamDftDeltaRho.cpp
@@ -287,6 +287,7 @@ void getVLoc(
           d_atomTolocPSPSplineMap.push_back(
               utils::Spline(radialValuesSTL,
                     potentialValuesLocSTL,
+                    false,
                     utils::Spline::spline_type::cspline,
                     false,
                     utils::Spline::bd_type::first_deriv,
diff --git a/analysis/classicalEnrichmentComparison/PSP/Si_BLPS_0.7_nodal.xml b/analysis/classicalEnrichmentComparison/PSP/Si_BLPS_0.7_nodal.xml
diff --git a/src/atoms/SphericalDataNumerical.cpp b/src/atoms/SphericalDataNumerical.cpp
@@ -297,7 +297,8 @@ namespace dftefe
     SphericalDataNumerical::initSpline()
     {
       d_spline = std::make_shared<const utils::Spline>(this->d_radialPoints,
-                                                       this->d_radialValues);
+                                                       this->d_radialValues,
+                                                       true);
     }
 
     double
diff --git a/src/basis/FEBasisOperations.t.cpp b/src/basis/FEBasisOperations.t.cpp
@@ -137,17 +137,24 @@ namespace dftefe
               sameQuadRuleInAllCells && (!variableDofsPerCell);
             linearAlgebra::blasLapack::Layout layout =
               linearAlgebra::blasLapack::Layout::ColMajor;
-            size_type NifNjStartOffset = 0;
+            size_type NifNjStartOffset = 0, quadCellsInBlockOffSet = 0;
 
             /** --- Storages --------- **/
             size_type maxDofInCell =
               *std::max_element(numCellDofs.begin(), numCellDofs.end());
             size_type maxQuadInCell =
               *std::max_element(numCellQuad.begin(), numCellQuad.end());
 
-            StorageUnion fxJxW(1 /*numComponents of f*/ * maxQuadInCell *
-                                 cellBlockSize,
+            const size_type numCumulativeQuadCells =
+              std::accumulate(numCellQuad.begin(), numCellQuad.end(), 0);
+
+            StorageUnion fxJxW(1 /*numComponents of f*/ *
+                                 numCumulativeQuadCells,
                                ValueTypeUnion());
+
+            // StorageUnion fxJxW(1 /*numComponents of f*/ * maxQuadInCell *
+            //                      cellBlockSize,
+            //                    ValueTypeUnion());
             StorageUnion fxJxWxNBlock(maxQuadInCell * cellBlockSize *
                                         maxDofInCell,
                                       ValueTypeUnion());
@@ -161,6 +168,22 @@ namespace dftefe
                                           ValueTypeBasisData());
             /** --- Storages --------- **/
 
+            if (f.getNumberComponents() == 1)
+              {
+                linearAlgebra::blasLapack::hadamardProduct(jxwStorage.size(),
+                                                           jxwStorage.data(),
+                                                           f.begin(),
+                                                           fxJxW.data(),
+                                                           linAlgOpContext);
+              }
+            else
+              {
+                utils::throwException(
+                  false,
+                  "quadValuesContainer f in BasisWeakFormKernelWithField"
+                  " can be only a scalar field in real space with 1 component.");
+              }
+
             for (size_type cellStartId = 0; cellStartId < numLocallyOwnedCells;
                  cellStartId += cellBlockSize)
               {
@@ -182,12 +205,13 @@ namespace dftefe
                                   numCellsInBlockQuad.end(),
                                   0);
 
-                size_type numCumulativeQuadxDofsCellsInBlock = 0;
+                // size_type numCumulativeQuadxDofsCellsInBlock = 0;
                 size_type numCumulativeDofsxDofsCellsInBlock = 0;
                 for (size_type iCell = 0; iCell < numCellsInBlock; iCell++)
                   {
-                    numCumulativeQuadxDofsCellsInBlock +=
-                      numCellsInBlockQuad[iCell] * numCellsInBlockDofs[iCell];
+                    // numCumulativeQuadxDofsCellsInBlock +=
+                    //   numCellsInBlockQuad[iCell] *
+                    //   numCellsInBlockDofs[iCell];
                     numCumulativeDofsxDofsCellsInBlock +=
                       numCellsInBlockDofs[iCell] * numCellsInBlockDofs[iCell];
                   }
@@ -216,25 +240,25 @@ namespace dftefe
                 /** --- Storages --------- **/
 
                 /*--------- Compute fxJxW -----------------*/
-                // TransposedKhatriRao product for inp and JxW
-                size_type cumulativeA = 0, cumulativeB = 0, cumulativeC = 0;
-                for (size_type iCell = 0; iCell < numCellsInBlock; iCell++)
-                  {
-                    linearAlgebra::blasLapack::khatriRaoProduct(
-                      layout,
-                      1,
-                      1,
-                      numCellsInBlockQuad[iCell],
-                      jxwStorage.data() +
-                        quadRuleContainer->getCellQuadStartId(cellStartId) +
-                        cumulativeA,
-                      f.begin(cellStartId) + cumulativeB,
-                      fxJxW.data() + cumulativeC,
-                      linAlgOpContext);
-                    cumulativeA += numCellsInBlockQuad[iCell];
-                    cumulativeB += numCellsInBlockQuad[iCell];
-                    cumulativeC += numCellsInBlockQuad[iCell];
-                  }
+                // // TransposedKhatriRao product for inp and JxW
+                // size_type cumulativeA = 0, cumulativeB = 0, cumulativeC = 0;
+                // for (size_type iCell = 0; iCell < numCellsInBlock; iCell++)
+                //   {
+                //     linearAlgebra::blasLapack::khatriRaoProduct(
+                //       layout,
+                //       1,
+                //       1,
+                //       numCellsInBlockQuad[iCell],
+                //       jxwStorage.data() +
+                //         quadRuleContainer->getCellQuadStartId(cellStartId) +
+                //         cumulativeA,
+                //       f.begin(cellStartId) + cumulativeB,
+                //       fxJxW.data() + cumulativeC,
+                //       linAlgOpContext);
+                //     cumulativeA += numCellsInBlockQuad[iCell];
+                //     cumulativeB += numCellsInBlockQuad[iCell];
+                //     cumulativeC += numCellsInBlockQuad[iCell];
+                //   }
 
                 /*--------- Compute fxJxWxN -----------------*/
                 linearAlgebra::blasLapack::ScalarOp scalarOpA =
@@ -296,7 +320,7 @@ namespace dftefe
                                mSize.data(),
                                nSize.data(),
                                kSize.data(),
-                               fxJxW.data(),
+                               fxJxW.data() + quadCellsInBlockOffSet,
                                basisDataInCellRange.data(),
                                fxJxWxNBlock.data(),
                                linAlgOpContext);
@@ -404,6 +428,7 @@ namespace dftefe
                                linAlgOpContext);
 
                 NifNjStartOffset += numCumulativeDofsxDofsCellsInBlock;
+                quadCellsInBlockOffSet += numCumulativeQuadCellsInBlock;
               }
           }
         else
diff --git a/src/ksdft/Defaults.cpp b/src/ksdft/Defaults.cpp
@@ -44,7 +44,7 @@ namespace dftefe
     const double LinearEigenSolverDefaults::ILL_COND_TOL = 1e-14;
     const double LinearEigenSolverDefaults::LANCZOS_EXTREME_EIGENVAL_TOL = 1e-6;
     const double LinearEigenSolverDefaults::LANCZOS_BETA_TOL = 1e-14;
-    const size_type LinearEigenSolverDefaults::LANCZOS_MAX_KRYLOV_SUBSPACE = 40;
+    const size_type LinearEigenSolverDefaults::LANCZOS_MAX_KRYLOV_SUBSPACE = 20;
     /**
      * @brief Setting all the ChebyshevPolynomialDegreeDefaults
      */
diff --git a/src/ksdft/KohnShamEigenSolver.t.cpp b/src/ksdft/KohnShamEigenSolver.t.cpp
@@ -160,7 +160,8 @@ namespace dftefe
                 1,
                 tol,
                 ksdft::LinearEigenSolverDefaults::LANCZOS_BETA_TOL,
-                *d_lanczosGuess);
+                *d_lanczosGuess,
+                false);
 
       linearAlgebra::MultiVector<ValueType, memorySpace> eigenVectorsLanczos;
 
diff --git a/src/ksdft/KohnShamOperatorContextFE.t.cpp b/src/ksdft/KohnShamOperatorContextFE.t.cpp
@@ -483,6 +483,25 @@ namespace dftefe
 
         size_type BStartOffset       = 0;
         size_type cellLocalIdsOffset = 0;
+
+        size_type maxDofInCell =
+          *std::max_element(numCellDofs.begin(), numCellDofs.end());
+
+        utils::MemoryStorage<ValueTypeOperand, memorySpace> xCellValues(
+          cellBlockSize * numVecs * maxDofInCell,
+          utils::Types<
+            linearAlgebra::blasLapack::scalar_type<ValueTypeOperator,
+                                                   ValueTypeOperand>>::zero);
+
+        utils::MemoryStorage<linearAlgebra::blasLapack::
+                               scalar_type<ValueTypeOperator, ValueTypeOperand>,
+                             memorySpace>
+          yCellValues(
+            cellBlockSize * numVecs * maxDofInCell,
+            utils::Types<
+              linearAlgebra::blasLapack::scalar_type<ValueTypeOperator,
+                                                     ValueTypeOperand>>::zero);
+
         for (size_type cellStartId = 0; cellStartId < numLocallyOwnedCells;
              cellStartId += cellBlockSize)
           {
@@ -504,11 +523,11 @@ namespace dftefe
             cellsInBlockNumDoFs.copyFrom(cellsInBlockNumDoFsSTL);
 
             // allocate memory for cell-wise data for x
-            utils::MemoryStorage<ValueTypeOperand, memorySpace> xCellValues(
-              cellsInBlockNumCumulativeDoFs * numVecs,
-              utils::Types<linearAlgebra::blasLapack::scalar_type<
-                ValueTypeOperator,
-                ValueTypeOperand>>::zero);
+            // utils::MemoryStorage<ValueTypeOperand, memorySpace> xCellValues(
+            //   cellsInBlockNumCumulativeDoFs * numVecs,
+            //   utils::Types<linearAlgebra::blasLapack::scalar_type<
+            //     ValueTypeOperator,
+            //     ValueTypeOperand>>::zero);
 
             // copy x to cell-wise data
             basis::FECellWiseDataOperations<ValueTypeOperand, memorySpace>::
@@ -557,14 +576,14 @@ namespace dftefe
               numVecs);
 
             // allocate memory for cell-wise data for y
-            utils::MemoryStorage<
-              linearAlgebra::blasLapack::scalar_type<ValueTypeOperator,
-                                                     ValueTypeOperand>,
-              memorySpace>
-              yCellValues(cellsInBlockNumCumulativeDoFs * numVecs,
-                          utils::Types<linearAlgebra::blasLapack::scalar_type<
-                            ValueTypeOperator,
-                            ValueTypeOperand>>::zero);
+            // utils::MemoryStorage<
+            //   linearAlgebra::blasLapack::scalar_type<ValueTypeOperator,
+            //                                          ValueTypeOperand>,
+            //   memorySpace>
+            //   yCellValues(cellsInBlockNumCumulativeDoFs * numVecs,
+            //               utils::Types<linearAlgebra::blasLapack::scalar_type<
+            //                 ValueTypeOperator,
+            //                 ValueTypeOperand>>::zero);
 
             linearAlgebra::blasLapack::scalar_type<ValueTypeOperator,
                                                    ValueTypeOperand>
diff --git a/src/linearAlgebra/LanczosExtremeEigenSolver.h b/src/linearAlgebra/LanczosExtremeEigenSolver.h
@@ -83,7 +83,8 @@ namespace dftefe
         const size_type                              numUpperExtermeEigenValues,
         std::vector<double> &                        tolerance,
         double                                       lanczosBetaTolerance,
-        const Vector<ValueTypeOperand, memorySpace> &initialGuess);
+        const Vector<ValueTypeOperand, memorySpace> &initialGuess,
+        bool                                         isAdaptiveSolve = true);
 
       LanczosExtremeEigenSolver(
         const size_type      maxKrylovSubspaceSize,
@@ -93,7 +94,8 @@ namespace dftefe
         double               lanczosBetaTolerance,
         std::shared_ptr<const utils::mpi::MPIPatternP2P<memorySpace>>
                                                       mpiPatternP2P,
-        std::shared_ptr<LinAlgOpContext<memorySpace>> linAlgOpContext);
+        std::shared_ptr<LinAlgOpContext<memorySpace>> linAlgOpContext,
+        bool                                          isAdaptiveSolve = true);
 
       /**
        *@brief Default Destructor
@@ -146,6 +148,7 @@ namespace dftefe
       std::vector<RealType>                 d_diagonal;
       std::vector<RealType>                 d_subDiagonal;
       bool                                  d_isSolved;
+      const bool                            d_isAdaptiveSolve;
 
 
     }; // end of class LanczosExtremeEigenSolver
diff --git a/src/linearAlgebra/LanczosExtremeEigenSolver.t.cpp b/src/linearAlgebra/LanczosExtremeEigenSolver.t.cpp
diff --git a/src/utils/Spline.cpp b/src/utils/Spline.cpp
diff --git a/src/utils/Spline.h b/src/utils/Spline.h

Original file line number	Diff line number	Diff line change
`@@ -297,7 +297,8 @@ namespace dftefe`
`297`	`297`	`SphericalDataNumerical::initSpline()`
`298`	`298`	`{`
`299`	`299`	`d_spline = std::make_shared<const utils::Spline>(this->d_radialPoints,`
`300`		`- this->d_radialValues);`
	`300`	`+ this->d_radialValues,`
	`301`	`+ true);`
`301`	`302`	`}`
`302`	`303`
`303`	`304`	`double`