dftfe/_atomic_centered_non_local_operator_8h_source.html

// ---------------------------------------------------------------------

//

// Copyright (c) 2017-2025 The Regents of the University of Michigan and DFT-FE

// authors.

//

// This file is part of the DFT-FE code.

//

// The DFT-FE code is free software; you can use it, redistribute

// it, and/or modify it under the terms of the GNU Lesser General

// Public License as published by the Free Software Foundation; either

// version 2.1 of the License, or (at your option) any later version.

// The full text of the license can be found in the file LICENSE at

// the top level of the DFT-FE distribution.

//

// ---------------------------------------------------------------------

//

// @author  Kartick Ramakrishnan, Vishal Subramanian, Sambit Das

//


#ifndef DFTFE_ATOMICCENTEREDNONLOCALOPERATOR_H

#define DFTFE_ATOMICCENTEREDNONLOCALOPERATOR_H

#include <MultiVector.h>

#include <headers.h>

#include <AtomCenteredSphericalFunctionContainer.h>

#include <sphericalHarmonicUtils.h>

#include <BLASWrapper.h>

#include <memory>

#include <MemorySpaceType.h>

#include "FEBasisOperations.h"

#include <headers.h>

#include <dftUtils.h>

#include <pseudoUtils.h>

#include <vectorUtilities.h>

#include <MPIPatternP2P.h>

#include <MultiVector.h>

#include <DeviceTypeConfig.h>

#include <cmath>

#include <linearAlgebraOperations.h>


namespace dftfe

{

  /**

   * @brief Enum class that lists the coupling-matrix structures

   * used in the non-local Operator. A value of this type is passed as the

   * couplingtype argument ("structure of coupling matrix") of the apply

   * functions of AtomicCenteredNonLocalOperator.

   *

   */


  enum class CouplingStructure

  {

    diagonal,

    dense,

    blockDiagonal

  };


  template <typename ValueType, dftfe::utils::MemorySpace memorySpace>


  class AtomicCenteredNonLocalOperator

  {

  public:

    /**

     * @brief Constructor. Only the declaration is visible in this header.

     * @param[in] BLASWrapperPtr BLASWrapper for the memory space of this

     * operator

     * @param[in] basisOperatorPtr FEBasisOperations object for the memory

     * space of this operator

     * @param[in] atomCenteredSphericalFunctionContainer container of the atom

     * centered spherical functions

     * @param[in] mpi_comm_parent MPI communicator

     * @param[in] memOptMode defaults to false; presumably stored in

     * d_memoryOptMode -- TODO confirm against the definition

     * @param[in] computeSphericalFnTimesX defaults to true; presumably stored

     * in d_computeSphericalFnTimesX -- TODO confirm against the definition

     * @param[in] useGlobalCMatrix defaults to false; presumably stored in

     * d_useGlobalCMatrix -- TODO confirm against the definition

     */

    AtomicCenteredNonLocalOperator(

      std::shared_ptr<dftfe::linearAlgebra::BLASWrapper<memorySpace>>

        BLASWrapperPtr,

      std::shared_ptr<

        dftfe::basis::FEBasisOperations<dataTypes::number, double, memorySpace>>

        basisOperatorPtr,

      std::shared_ptr<AtomCenteredSphericalFunctionContainer>

                      atomCenteredSphericalFunctionContainer,

      const MPI_Comm &mpi_comm_parent,

      const bool      memOptMode               = false,

      const bool      computeSphericalFnTimesX = true,

      const bool      useGlobalCMatrix         = false);


    /**

     * @brief Resizes various internal data members and selects the k-point of interest.

     * @param[in] kPointIndex index of the k-point of interest

     */

    void

    initialiseOperatorActionOnX(dftfe::uInt kPointIndex);

    /**

     * @brief Initialises the multivector object and waveFunctionBlockSize, and resizes various internal data members.

     * @param[in] waveFunctionBlockSize sets the wavefunction block size for the

     * action of the nonlocal operator.

     * @param[out] sphericalFunctionKetTimesVectorParFlattened the multivector

     * that is initialised based on blocksize and partitioner.

     */

    void

    initialiseFlattenedDataStructure(

      dftfe::uInt waveFunctionBlockSize,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

        &sphericalFunctionKetTimesVectorParFlattened);

    /**

     * @brief calls internal functions: initialisePartitioner, initKpoints and computeCMatrixEntries

     *

     * NOTE: the function name is spelled "intitialise..." (sic). It is part of

     * the public interface and is therefore left unchanged.

     * @param[in] updateSparsity flag on whether the sparsity pattern was

     * updated, hence the partitioner is updated.

     * @param[in] kPointWeights std::vector<double> of size number of kPoints

     * @param[in] kPointCoordinates std::vector<double> of kPoint coordinates

     * @param[in] basisOperationsPtr HOST FEBasisOperations shared_ptr required

     * to identify the element ids and quad points

     * @param[in] BLASWrapperHostPtr HOST BLASWrapper

     * @param[in] quadratureIndex quadrature index for sampling the spherical

     * function. Quadrature Index is used to reinit basisOperationsPtr

     */

    void

    intitialisePartitionerKPointsAndComputeCMatrixEntries(

      const bool                 updateSparsity,

      const std::vector<double> &kPointWeights,

      const std::vector<double> &kPointCoordinates,

      std::shared_ptr<

        dftfe::basis::FEBasisOperations<dataTypes::number,

                                        double,

                                        dftfe::utils::MemorySpace::HOST>>

        basisOperationsPtr,

      std::shared_ptr<

        dftfe::linearAlgebra::BLASWrapper<dftfe::utils::MemorySpace::HOST>>

                        BLASWrapperHostPtr,

      const dftfe::uInt quadratureIndex);

    /**

     * @brief Sets up the partitioner, k-points and C matrix entries of this operator using nonLocalOperatorSrc as the source.

     *

     * As stated for nonLocalOperatorSrc below, the CMatrix and partitioner are

     * copied from the source operator. Which internal functions are called is

     * not visible in this header -- see the definition.

     * @param[in] updateSparsity flag on whether the sparsity pattern was

     * updated, hence the partitioner is updated.

     * @param[in] kPointWeights std::vector<double> of size number of kPoints

     * @param[in] kPointCoordinates std::vector<double> of kPoint coordinates

     * @param[in] basisOperationsPtr HOST FEBasisOperations shared_ptr required

     * to identify the element ids and quad points

     * @param[in] BLASWrapperHostPtr CPU blasWrapperPtr, used for xcopy calls

     * @param[in] quadratureIndex quadrature index for sampling the spherical

     * function. Quadrature Index is used to reinit basisOperationsPtr

     * @param[in] nonLocalOperatorSrc The source nonLocalOperator from where the

     * CMatrix and partitioner is copied. Generally, it is of higher precision.

     */

    template <typename ValueTypeSrc>

    void

    copyPartitionerKPointsAndComputeCMatrixEntries(

      const bool                 updateSparsity,

      const std::vector<double> &kPointWeights,

      const std::vector<double> &kPointCoordinates,

      std::shared_ptr<

        dftfe::basis::FEBasisOperations<dataTypes::number,

                                        double,

                                        dftfe::utils::MemorySpace::HOST>>

        basisOperationsPtr,

      std::shared_ptr<

        dftfe::linearAlgebra::BLASWrapper<dftfe::utils::MemorySpace::HOST>>

                        BLASWrapperHostPtr,

      const dftfe::uInt quadratureIndex,

      const std::shared_ptr<

        AtomicCenteredNonLocalOperator<ValueTypeSrc, memorySpace>>

        nonLocalOperatorSrc);

#if defined(DFTFE_WITH_DEVICE)

    // for device specific initialise

    /**

     * @brief Device-only initialisation that takes the cell-level wavefunction storage.

     *

     * Presumably sets up the wavefunction pointer arrays of this class

     * (hostWfcPointers, deviceWfcPointers, d_wfcStartPointer) -- TODO confirm

     * against the definition.

     *

     * NOTE(review): the earlier documentation of this function listed

     * totalAtomsInCurrentProcessor, totalNonLocalElements,

     * numberCellsForEachAtom and numberCellsAccumNonLocalAtoms as parameters.

     * None of them appears in the signature.

     * @param[in] cellWaveFunctionMatrix DEVICE memory storage of the cell level

     * wavefunctions (taken by non-const reference)

     */

    void

    initialiseCellWaveFunctionPointers(

      dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

        &cellWaveFunctionMatrix);


    /**

     * @brief Device-only clean-up. Presumably releases the raw pointer arrays

     * set up by initialiseCellWaveFunctionPointers -- TODO confirm.

     */

    void

    freeDeviceVectors();

#endif


    // Getter functions

    // Returns the vector that takes in nonlocalElementIndex and returns the

    // cellID

    const std::vector<dftfe::uInt> &

    getNonlocalElementToCellIdVector() const;

    // Returns the number of atoms in current processor

    dftfe::uInt

    getTotalAtomInCurrentProcessor() const;


    // Presumably returns d_flattenedNonLocalCellDofIndexToProcessDofIndexMap

    // -- TODO confirm against the definition

    const dftfe::utils::MemoryStorage<dftfe::uInt, memorySpace> &

    getFlattenedNonLocalCellDofIndexToProcessDofIndexMap() const;


    // Presumably returns d_totalNonlocalElems -- TODO confirm

    dftfe::uInt

    getTotalNonLocalElementsInCurrentProcessor() const;


    // Presumably returns d_totalNonLocalEntries -- TODO confirm

    dftfe::uInt

    getTotalNonLocalEntriesCurrentProcessor() const;


    // Presumably returns d_maxSingleAtomContribution -- TODO confirm

    dftfe::uInt

    getMaxSingleAtomEntries() const;


    // Presumably true when at least one atom has compact support in element

    // iElem -- TODO confirm

    bool

    atomSupportInElement(dftfe::uInt iElem) const;


    // Presumably the global id in the distributed vector of spherical

    // function alpha of atom atomId -- TODO confirm

    dftfe::uInt

    getGlobalDofAtomIdSphericalFnPair(const dftfe::uInt atomId,

                                      const dftfe::uInt alpha) const;


    // Presumably maps a global id of the distributed vector to its local id

    // -- TODO confirm

    dftfe::uInt

    getLocalIdOfDistributedVec(const dftfe::uInt globalId) const;


    // NOTE(review): the three getters below return a non-const reference from

    // a const member function; confirm whether a const reference was intended.

    // NOTE(review): d_nonlocalElemIdToLocalElemIdMap is only declared when

    // DFTFE_WITH_DEVICE is defined, while this getter is declared

    // unconditionally -- confirm which member it returns.

    std::vector<dftfe::uInt> &

    getNonLocalElemIdToLocalElemIdMap() const;


    std::vector<dftfe::uInt> &

    getAtomWiseNumberCellsInCompactSupport() const;


    std::vector<dftfe::uInt> &

    getAtomWiseNumberCellsAccumulated() const;


    // Presumably returns d_atomCenteredKpointIndexedSphericalFnQuadValues

    // (commented as required by force.cc) -- TODO confirm

    const std::vector<ValueType> &

    getAtomCenteredKpointIndexedSphericalFnQuadValues() const;


    // Presumably returns

    // d_atomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues

    // (commented as required for stress compute) -- TODO confirm

    const std::vector<ValueType> &

    getAtomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues() const;


    // Presumably returns d_cellIdToAtomIdsLocalCompactSupportMap, the map from

    // cell number to non local atom ids (local numbering) -- TODO confirm

    const std::map<dftfe::uInt, std::vector<dftfe::uInt>> &

    getCellIdToAtomIdsLocalCompactSupportMap() const;


    // Presumably returns d_nonTrivialSphericalFnPerCell -- TODO confirm

    const std::vector<dftfe::uInt> &

    getNonTrivialSphericalFnsPerCell() const;


    // Presumably returns d_nonTrivialSphericalFnsCellStartIndex -- TODO confirm

    const std::vector<dftfe::uInt> &

    getNonTrivialSphericalFnsCellStartIndex() const;


    // Presumably returns d_sumNonTrivialSphericalFnOverAllCells -- TODO

    // confirm. NOTE(review): the return value is declared const although it is

    // returned by value.

    const dftfe::uInt

    getTotalNonTrivialSphericalFnsOverAllCells() const;


    // Presumably returns d_nonTrivialAllCellsSphericalFnAlphaToElemIdMap --

    // TODO confirm

    const std::vector<dftfe::uInt> &

    getNonTrivialAllCellsSphericalFnAlphaToElemIdMap() const;


    /**

     * @brief Required in configurational forces. Cumulative spherical Fn Id. The size is numCells in processor

     */

    const std::map<dftfe::uInt, std::vector<dftfe::uInt>> &

    getAtomIdToNonTrivialSphericalFnCellStartIndex() const;


    /**

     * @brief Returns the Flattened vector of sphericalFunctionIDs in order of atomIDs of atoms in processor.

     */

    const std::vector<dftfe::uInt> &

    getSphericalFnTimesVectorFlattenedVectorLocalIds() const;


    /**

     * @brief Presumably returns d_OwnedAtomIdsInCurrentProcessor -- TODO confirm against the definition.

     */

    const std::vector<dftfe::uInt> &

    getOwnedAtomIdsInCurrentProcessor() const;

    /**

     * @brief Computes C^{T}D^{-1}C at the global level for atomId. This is required in PAW

     * @param[in] atomId atom for which the product is computed

     * @param[in] BLASWrapperPtr HOST BLASWrapper

     * @param[in] Dinverse HOST memory storage, presumably holding the entries

     * of D^{-1} -- TODO confirm layout

     * @param PconjtransposePmatrix HOST memory storage, presumably meant to

     * receive the result. NOTE(review): it is taken by value, so unless

     * MemoryStorage copies are shallow the caller's object is not modified --

     * confirm against the definition whether a reference was intended.

     */

    void

    computeCconjtransCMatrix(

      const dftfe::uInt atomId,

      std::shared_ptr<

        dftfe::linearAlgebra::BLASWrapper<dftfe::utils::MemorySpace::HOST>>

        BLASWrapperPtr,

      const dftfe::utils::MemoryStorage<double, dftfe::utils::MemorySpace::HOST>

        &Dinverse,

      dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::HOST>

        PconjtransposePmatrix);

    // Calls for both device and host

    /**

     * @brief compute the action of coupling matrix on sphericalFunctionKetTimesVectorParFlattened.

     * @param[in] couplingtype structure of coupling matrix

     * @param[in] couplingMatrix entries of the coupling matrix V in

     * CVCconjtrans. Ensure that the coupling matrix is padded. Refer to

     * ONCVclass for template

     * @param[in,out] sphericalFunctionKetTimesVectorParFlattened multivector

     * to store results of CconjtransX which is initialised using the

     * initialiseFlattenedDataStructure call. The results are stored in

     * sphericalFunctionKetTimesVectorParFlattened or internal data member based

     * on flagCopyResultsToMatrix.

     * @param[in] flagCopyResultsToMatrix flag to confirm whether to scale the

     * multivector sphericalFunctionKetTimesVectorParFlattened or store results

     * in internal data member. Defaults to true.

     * @param[in] kPointIndex k-point index, defaults to 0. How it is used is

     * not visible in this header -- see the definition.

     */

    void

    applyVOnCconjtransX(

      const CouplingStructure                                    couplingtype,

      const dftfe::utils::MemoryStorage<ValueType, memorySpace> &couplingMatrix,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

                       &sphericalFunctionKetTimesVectorParFlattened,

      const bool        flagCopyResultsToMatrix = true,

      const dftfe::uInt kPointIndex             = 0);


    /**

     * @brief After AllReduce function is called this will copy to the nonLocalOperatorClassDatastructure.

     * @param[in] sphericalFunctionKetTimesVectorParFlattened distributed

     * multivector that is copied from (taken by non-const reference)

     * @param[in] scalingVector presumably scaling factors applied during the

     * copy -- TODO confirm against the definition

     */

    void

    copyBackFromDistributedVectorToLocalDataStructure(

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

        &sphericalFunctionKetTimesVectorParFlattened,

      const dftfe::utils::MemoryStorage<double, memorySpace> &scalingVector);

    /**

     * @brief copies the results from internal member to sphericalFunctionKetTimesVectorParFlattened, on which ghost values are called.

     * crucial operation for completion of the full CconjtransX on all cells

     * @param[in,out] sphericalFunctionKetTimesVectorParFlattened multivector

     * to store results of CconjtransX which is initialised using the

     * initialiseFlattenedDataStructure call

     * @param[in] skipComm defaults to false. Presumably skips the

     * communication step, for compute-communication overlap in ChFSI on GPUs

     * -- TODO confirm against the definition. NOTE(review): the earlier

     * documentation described two flags, skip1 and skip2, which are not

     * parameters of this function.

     */

    void

    applyAllReduceOnCconjtransX(

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

                &sphericalFunctionKetTimesVectorParFlattened,

      const bool skipComm = false);


    /**

     * @brief computes the results of CconjtransX on the cells of interest specified by cellRange

     * @param[in] X input cell level vector

     * @param[in] cellRange start and end element id in list of nonlocal

     * elements

     */

    void

    applyCconjtransOnX(const ValueType                          *X,

                       const std::pair<dftfe::uInt, dftfe::uInt> cellRange);


    /**

     * @brief computes the results of CconjtransX on nodal X vector

     * @param[in] X input nodal multivector

     */

    void

    applyCconjtransOnX(

      const dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &X);


    // Returns the pointer of CTX stored in HOST memory for the atom Index in

    // the list of atoms with support in the processor.

    /**

     * @brief Returns the pointer of CTX stored in HOST memory

     * @param[in] iAtom atomIndex in the list of atoms with support in the

     * current processor. NOTE!! One must be careful here: iAtom indexes that

     * list of atoms with support in the current processor; presumably it is

     * not a global atom id -- TODO confirm.

     */

    const ValueType *

    getCconjtansXLocalDataStructure(const dftfe::uInt iAtom) const;


    /**

     * @brief completes the VCconjX on nodal vector src. The src vector must have all ghost nodes and constraint nodes updated.

     * @param[in] src input nodal vector on which operator acts on.

     * @param[in] kPointIndex kPoint of interest for current operation

     * @param[in] couplingtype structure of coupling matrix

     * @param[in] couplingMatrix entries of the coupling matrix V in

     * CVCconjtrans. Ensure the coupling matrix is padded

     * @param[out] sphericalFunctionKetTimesVectorParFlattened multivector to

     * store results of CconjtransX which is initialised using the

     * initialiseFlattenedDataStructure call

     * @param[in] flagScaleInternalMatrix defaults to false. Presumably selects

     * whether the internal data member is scaled instead of the multivector

     * -- TODO confirm against the definition

     */

    void

    applyVCconjtransOnX(

      const dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &src,

      const dftfe::uInt                                          kPointIndex,

      const CouplingStructure                                    couplingtype,

      const dftfe::utils::MemoryStorage<ValueType, memorySpace> &couplingMatrix,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

                &sphericalFunctionKetTimesVectorParFlattened,

      const bool flagScaleInternalMatrix = false);


    /**

     * @brief completes the action of CVCconjtranspose on nodal vector src. The src vector must have all ghost nodes and constraint nodes updated.

     * @param[in] src input nodal vector on which operator acts on.

     * @param[in] kPointIndex kPoint of interest for current operation

     * @param[in] couplingtype structure of coupling matrix

     * @param[in] couplingMatrix entries of the coupling matrix V in

     * CVCconjtrans

     * @param[in,out] sphericalFunctionKetTimesVectorParFlattened multivector

     * to store results of CconjtransX which is initialised using the

     * initialiseFlattenedDataStructure call

     * @param[out] dst output nodal vector where the results of the operator is

     * copied into.

     */

    void

    applyCVCconjtransOnX(

      const dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &src,

      const dftfe::uInt                                          kPointIndex,

      const CouplingStructure                                    couplingtype,

      const dftfe::utils::MemoryStorage<ValueType, memorySpace> &couplingMatrix,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

        &sphericalFunctionKetTimesVectorParFlattened,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &dst);


    /**

     * @brief adds the result of CVCtX onto Xout for both CPU and GPU calls

     * @param[in,out] Xout pointer to cell level storage of size

     * cells*numberOfNodes*BlockSize. Typical case holds the results of

     * H_{loc}X

     * @param[in] cellRange start and end element id in list of nonlocal

     * elements

     */

    void

    applyCOnVCconjtransX(ValueType                                *Xout,

                         const std::pair<dftfe::uInt, dftfe::uInt> cellRange);


    /**

     * @brief adds the result of CVCtX onto Xout for both CPU and GPU calls

     *

     * Overload acting on a MultiVector; it takes no cellRange argument.

     * @param[in,out] Xout multivector onto which the result is added. Typical

     * case holds the results of H_{loc}X

     */

    void

    applyCOnVCconjtransX(

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &Xout);


    /**

     * @brief Returns, by value, C matrix entries selected by k-point, atom and element.

     *

     * NOTE(review): kPointIndex and iElem are signed (dftfe::Int) while atomId

     * is unsigned (dftfe::uInt); the meaning of negative values, if any, is

     * not visible in this header -- confirm against the definition.

     * @param[in] kPointIndex k-point index

     * @param[in] atomId atom id

     * @param[in] iElem element index

     */

    std::vector<ValueType>

    getCmatrixEntries(dftfe::Int  kPointIndex,

                      dftfe::uInt atomId,

                      dftfe::Int  iElem) const;


    /**

     * @brief Presumably true when at least one atom has compact support in an

     * element of cellRange -- TODO confirm against the definition.

     * @param[in] cellRange start and end element id

     */

    bool

    atomPresentInCellRange(

      const std::pair<dftfe::uInt, dftfe::uInt> cellRange) const;

    /**

     * @brief Called only for GPU runs where the coupling matrix has to be padded

     * @param[in] entries Coupling matrix entries without padding in the atomId

     * order

     * @param[out] entriesPadded Padded coupling matrix entries

     * @param[in] couplingtype Determines the dimension of entriesPadded and the

     * padding mechanism

     */

    void

    paddingCouplingMatrix(const std::vector<ValueType> &entries,

                          std::vector<ValueType>       &entriesPadded,

                          const CouplingStructure       couplingtype);


    /**

     * @brief Returns C matrix entries for chargeId and its compact support element Id.

     *

     * NOTE(review): going by the function name these are presumably the

     * conjugate entries (d_CMatrixEntriesConjugate) -- TODO confirm against

     * the definition.

     */

    const std::vector<ValueType> &

    getCmatrixEntriesConjugate(const dftfe::uInt chargeId,

                               const dftfe::uInt iElemComp) const;

    /**

     * @brief Returns C conj matrix entries for chargeId and its compact support element Id.

     *

     * NOTE(review): going by the function name these are presumably the

     * transpose entries (d_CMatrixEntriesTranspose) -- TODO confirm against

     * the definition.

     */

    const std::vector<ValueType> &

    getCmatrixEntriesTranspose(const dftfe::uInt chargeId,

                               const dftfe::uInt iElemComp) const;

    /**

     * @brief Returns global C matrix of all atoms.

     */

    const std::vector<

      std::vector<dftfe::utils::MemoryStorage<ValueType, memorySpace>>> &

    getGlobalCMatrix() const;


  protected:

    /**

     * @brief completes the VCconjX on nodal vector src. The src vector must have all ghost nodes and constraint nodes updated.

     *

     * Presumably the cell-level code path of applyVCconjtransOnX -- TODO

     * confirm against the definition.

     * @param[in] src input nodal vector on which operator acts on.

     * @param[in] kPointIndex kPoint of interest for current operation

     * @param[in] couplingtype structure of coupling matrix

     * @param[in] couplingMatrix entries of the coupling matrix V in

     * CVCconjtrans. Ensure the coupling matrix is padded

     * @param[out] sphericalFunctionKetTimesVectorParFlattened multivector to

     * store results of CconjtransX which is initialised using the

     * initialiseFlattenedDataStructure call

     * @param[in] flagScaleInternalMatrix defaults to false. Presumably selects

     * whether the internal data member is scaled instead of the multivector

     * -- TODO confirm against the definition

     */

    void

    applyVCconjtransOnXCellLevel(

      const dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &src,

      const dftfe::uInt                                          kPointIndex,

      const CouplingStructure                                    couplingtype,

      const dftfe::utils::MemoryStorage<ValueType, memorySpace> &couplingMatrix,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

                &sphericalFunctionKetTimesVectorParFlattened,

      const bool flagScaleInternalMatrix = false);


    /**

     * @brief completes the VCconjX on nodal vector src using global C matrix.

     * The global C matrix must have been computed before.

     * The src vector must have all ghost nodes and constraint nodes updated.

     * @param[in] src input nodal vector on which operator acts on.

     * @param[in] kPointIndex kPoint of interest for current operation

     * @param[in] couplingtype structure of coupling matrix

     * @param[in] couplingMatrix entries of the coupling matrix V in

     * CVCconjtrans. Ensure the coupling matrix is padded

     * @param[out] sphericalFunctionKetTimesVectorParFlattened multivector to

     * store results of CconjtransX which is initialised using the

     * initialiseFlattenedDataStructure call

     * @param[in] flagScaleInternalMatrix defaults to false. Presumably selects

     * whether the internal data member is scaled instead of the multivector

     * -- TODO confirm against the definition

     */

    void

    applyVCconjtransOnXUsingGlobalC(

      const dftfe::linearAlgebra::MultiVector<ValueType, memorySpace> &src,

      const dftfe::uInt                                          kPointIndex,

      const CouplingStructure                                    couplingtype,

      const dftfe::utils::MemoryStorage<ValueType, memorySpace> &couplingMatrix,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

                &sphericalFunctionKetTimesVectorParFlattened,

      const bool flagScaleInternalMatrix = false);


    // Presumably set once the all-reduce step of CconjtransX has been done --

    // TODO confirm against the definition

    bool                d_AllReduceCompleted;

    // k-point weights and coordinates (see initKpoints)

    std::vector<double> d_kPointWeights;

    std::vector<double> d_kPointCoordinates;

    std::shared_ptr<dftfe::linearAlgebra::BLASWrapper<memorySpace>>

      d_BLASWrapperPtr;

    std::shared_ptr<AtomCenteredSphericalFunctionContainer>

      d_atomCenteredSphericalFunctionContainer;

    // NOTE: the MPI pattern is declared for HOST memory space regardless of

    // the memorySpace template parameter of this class

    std::shared_ptr<

      const utils::mpi::MPIPatternP2P<dftfe::utils::MemorySpace::HOST>>

                             d_mpiPatternP2P;

    std::vector<dftfe::uInt> d_numberCellsForEachAtom;


    std::shared_ptr<

      dftfe::basis::FEBasisOperations<dataTypes::number, double, memorySpace>>

      d_basisOperatorPtr;


    // Required by force.cc

    std::vector<ValueType> d_atomCenteredKpointIndexedSphericalFnQuadValues;

    // Required for stress compute

    std::vector<ValueType>

      d_atomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues;


    /// map from cell number to set of non local atom ids (local numbering)

    std::map<dftfe::uInt, std::vector<dftfe::uInt>>

      d_cellIdToAtomIdsLocalCompactSupportMap;


    /// vector of size num physical cells

    std::vector<dftfe::uInt> d_nonTrivialSphericalFnPerCell;


    /// vector of size num physical cell with starting index for each cell for

    /// the above array

    std::vector<dftfe::uInt> d_nonTrivialSphericalFnsCellStartIndex;


    std::vector<dftfe::uInt> d_nonTrivialAllCellsSphericalFnAlphaToElemIdMap;


    /// map from local nonlocal atomid to vector over cells

    std::map<dftfe::uInt, std::vector<dftfe::uInt>>

      d_atomIdToNonTrivialSphericalFnCellStartIndex;


    dftfe::uInt d_sumNonTrivialSphericalFnOverAllCells;


    std::vector<dftfe::uInt> d_sphericalFnTimesVectorFlattenedVectorLocalIds;


    // The above set of variables are needed in force class


#ifdef USE_COMPLEX

    // Complex build: element type is std::complex<double>

    std::vector<distributedCPUVec<std::complex<double>>>

      d_SphericalFunctionKetTimesVectorPar;


#else

    // Real build: element type is double

    std::vector<distributedCPUVec<double>> d_SphericalFunctionKetTimesVectorPar;

#endif


    // Keyed by a pair of ids; presumably (atomId, spherical function index)

    // -- TODO confirm

    std::map<std::pair<dftfe::uInt, dftfe::uInt>, dftfe::uInt>

      d_sphericalFunctionIdsNumberingMapCurrentProcess;


    std::vector<dftfe::uInt> d_OwnedAtomIdsInCurrentProcessor;

    dealii::IndexSet         d_locallyOwnedAtomCenteredFnIdsCurrentProcess;

    dealii::IndexSet         d_ghostAtomCenteredFnIdsCurrentProcess;

    std::map<std::pair<dftfe::uInt, dftfe::uInt>, dftfe::uInt>

      d_AtomCenteredFnIdsNumberingMapCurrentProcess;

    // C matrix entries in the memory space of this operator; the meaning of

    // the three nesting levels is not visible in this header

    std::vector<std::vector<

      std::vector<dftfe::utils::MemoryStorage<ValueType, memorySpace>>>>

                               d_CMatrixEntries;

    dealii::ConditionalOStream pcout;

    const MPI_Comm             d_mpi_communicator;

    const dftfe::uInt          d_this_mpi_process;

    const dftfe::uInt          d_n_mpi_processes;

    dealii::IndexSet           d_locallyOwnedSphericalFunctionIdsCurrentProcess;

    dealii::IndexSet           d_ghostSphericalFunctionIdsCurrentProcess;


    dftfe::uInt d_totalAtomsInCurrentProc; // number of atoms of interest with

                                           // compact support in current processor

    dftfe::uInt

      d_totalNonlocalElems; // number of nonlocal FE cells having nonlocal

                            // contribution in current processor

    dftfe::uInt d_totalNonLocalEntries; // Total number of nonlocal components

    dftfe::uInt

      d_maxSingleAtomContribution; // maximum number of nonlocal indexes across

                                   // all atoms of interest

    std::vector<dftfe::uInt> d_numberCellsAccumNonLocalAtoms;

    dftfe::utils::MemoryStorage<dftfe::uInt, memorySpace>

                d_iElemNonLocalToElemIndexMap;

    dftfe::uInt d_numberNodesPerElement; // Access from BasisOperator while

                                         // filling CMatrixEntries

    dftfe::uInt d_locallyOwnedCells;

    dftfe::uInt d_numberWaveFunctions;

    dftfe::uInt d_kPointIndex;

    bool        d_memoryOptMode;

    // Presumably tracks whether the raw device pointer arrays have been

    // allocated -- TODO confirm

    bool        d_isMallocCalled = false;

    // Host CMatrix Entries are stored here

    std::vector<std::vector<std::vector<ValueType>>> d_CMatrixEntriesConjugate,

      d_CMatrixEntriesTranspose;


  private:

    /**

     * @brief stores the d_kPointWeights, d_kPointCoordinates. Other data members are computed from the container data object

     * @param[in] kPointWeights std::vector<double> of size number of kPoints

     * @param[in] kPointCoordinates std::vector<double> of kPoint coordinates

     */

    void

    initKpoints(const std::vector<double> &kPointWeights,

                const std::vector<double> &kPointCoordinates);

    /**

     * @brief creates the partitioner for the distributed vector based on sparsity pattern from sphericalFn container.

     *

     * Takes no arguments. NOTE(review): the earlier documentation listed a

     * basisOperationsPtr parameter, which is not part of the signature.

     */

    void

    initialisePartitioner();

    /**

     * @brief computes the entries in C matrix for CPUs and GPUs. On GPUs the entries are copied to a flattened vector on device memory.

     * Further on GPUs, various maps are created crucial for accessing and

     * padding entries in Cmatrix flattened device.

     * @param[in] basisOperationsPtr HOST FEBasisOperations shared_ptr required

     * to identify the element ids and quad points

     * @param[in] quadratureIndex quadrature index for sampling the spherical

     * function. Quadrature Index is used to reinit basisOperationsPtr

     */

    void

    computeCMatrixEntries(

      std::shared_ptr<dftfe::basis::FEBasisOperations<

        dataTypes::number,

        double,

        dftfe::utils::MemorySpace::HOST>> basisOperationsPtr,

      const dftfe::uInt                   quadratureIndex);


    /**

     * @brief Presumably copies the C matrix entries from nonLocalOperatorSrc

     * into this operator, converting from ValueTypeSrc to ValueType -- TODO

     * confirm against the definition.

     * @param[in] nonLocalOperatorSrc source operator, possibly of a different

     * value type but of the same memory space

     * @param[in] basisOperationsPtr HOST FEBasisOperations shared_ptr

     * @param[in] quadratureIndex quadrature index

     */

    template <typename ValueTypeSrc>

    void

    copyCMatrixEntries(

      const std::shared_ptr<

        AtomicCenteredNonLocalOperator<ValueTypeSrc, memorySpace>>

        nonLocalOperatorSrc,

      std::shared_ptr<

        dftfe::basis::FEBasisOperations<dataTypes::number,

                                        double,

                                        dftfe::utils::MemorySpace::HOST>>

                        basisOperationsPtr,

      const dftfe::uInt quadratureIndex);


    /**

     * @brief Presumably copies the global C matrix from nonLocalOperatorSrc

     * into this operator, converting from ValueTypeSrc to ValueType -- TODO

     * confirm against the definition.

     * @param[in] nonLocalOperatorSrc source operator, possibly of a different

     * value type but of the same memory space

     * @param[in] basisOperationsPtr HOST FEBasisOperations shared_ptr

     * @param[in] quadratureIndex quadrature index

     */

    template <typename ValueTypeSrc>

    void

    copyGlobalCMatrix(

      const std::shared_ptr<

        AtomicCenteredNonLocalOperator<ValueTypeSrc, memorySpace>>

        nonLocalOperatorSrc,

      std::shared_ptr<

        dftfe::basis::FEBasisOperations<dataTypes::number,

                                        double,

                                        dftfe::utils::MemorySpace::HOST>>

                        basisOperationsPtr,

      const dftfe::uInt quadratureIndex);


    // HOST storage keyed by an unsigned id; presumably the per-atom CTX data

    // handed out by getCconjtansXLocalDataStructure -- TODO confirm

    std::map<

      dftfe::uInt,

      dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::HOST>>

      d_sphericalFnTimesWavefunMatrix;

    // The same map is kept as a std::vector and as a MemoryStorage in the

    // memory space of this operator (going by the names)

    std::vector<dftfe::uInt>

      d_flattenedNonLocalCellDofIndexToProcessDofIndexVector;

    dftfe::utils::MemoryStorage<dftfe::uInt, memorySpace>

      d_flattenedNonLocalCellDofIndexToProcessDofIndexMap;

    std::vector<dftfe::uInt> d_nonlocalElemIdToCellIdVector;

    bool                     d_computeSphericalFnTimesX;

    bool                     d_useGlobalCMatrix;

    std::vector<dftfe::uInt> d_atomStartIndexGlobal;

    dftfe::uInt              d_totalNumSphericalFunctionsGlobal;


    // Global C matrix, see getGlobalCMatrix and computeGlobalCMatrixVector

    std::vector<

      std::vector<dftfe::utils::MemoryStorage<ValueType, memorySpace>>>

      d_CMatrixGlobal;


    std::set<dftfe::uInt>    d_setOfAtomicNumber;

    std::vector<dftfe::uInt> d_mapAtomIdToSpeciesIndex,

      d_mapiAtomToSpeciesIndex;

    std::vector<dftfe::utils::MemoryStorage<ValueType, memorySpace>>

                             d_dotProductAtomicWaveInputWaveTemp;

    std::vector<dftfe::uInt> d_mapIAtomicNumToDotProd;

    std::vector<dftfe::uInt> d_mapiAtomToDotProd;


    dftfe::uInt d_totalLocallyOwnedNodes;


    std::vector<dftfe::uInt> d_mapiAtomTosphFuncWaveStart;

    std::map<dftfe::uInt, std::vector<dftfe::uInt>> d_listOfiAtomInSpecies;


    /**

     * @brief computes Global Cmatrix on HOST.

     * @param[in] basisOperationsPtr HOST FEBasisOperations shared_ptr required

     * to identify the element ids and quad points

     * @param[in] BLASWrapperHostPtr HOST BLASWrapper

     */

    void

    computeGlobalCMatrixVector(

      std::shared_ptr<dftfe::basis::FEBasisOperations<

        dataTypes::number,

        double,

        dftfe::utils::MemorySpace::HOST>> basisOperationsPtr,

      std::shared_ptr<

        dftfe::linearAlgebra::BLASWrapper<dftfe::utils::MemorySpace::HOST>>

        BLASWrapperHostPtr);


#if defined(DFTFE_WITH_DEVICE)

    /**

     * @brief Copies the data from distributed Vector to Padded Memory storage object.

     * @param[in] sphericalFunctionKetTimesVectorParFlattened Distributed Vector

     * @param[out] paddedVector Padded Vector of size

     * noAtomsInProc*maxSingleAtomContribution*Nwfc

     */

    void

    copyDistributedVectorToPaddedMemoryStorageVectorDevice(

      const dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

        &sphericalFunctionKetTimesVectorParFlattened,

      dftfe::utils::MemoryStorage<ValueType, memorySpace> &paddedVector);


    /**

     * @brief Copies Padded Memory storage object to Distributed vector.

     * @param[in] paddedVector Padded Vector of size

     * noAtomsInProc*maxSingleAtomContribution*Nwfc

     * @param[out] sphericalFunctionKetTimesVectorParFlattened Distributed

     * Vector

     *

     */

    void

    copyPaddedMemoryStorageVectorToDistributeVectorDevice(

      const dftfe::utils::MemoryStorage<ValueType, memorySpace> &paddedVector,

      dftfe::linearAlgebra::MultiVector<ValueType, memorySpace>

        &sphericalFunctionKetTimesVectorParFlattened);


    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::HOST>

      d_tempConjtansX;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

                d_sphericalFnTimesWavefunctionMatrix;

    // NOTE(review): the raw pointer members below have no in-class

    // initialiser. Presumably they are allocated in

    // initialiseCellWaveFunctionPointers and released in freeDeviceVectors,

    // guarded by d_isMallocCalled -- TODO confirm against the definitions.

    ValueType **hostPointerCDagger, **hostPointerCDaggeOutTemp,

      **hostWfcPointers;

    ValueType  *d_wfcStartPointer;

    ValueType **devicePointerCDagger, **devicePointerCDaggerOutTemp,

      **deviceWfcPointers;

    std::vector<dftfe::uInt> d_nonlocalElemIdToLocalElemIdMap;


    // The below memory storage object receives the copy of the distributed

    // ketTimesWfc data in a padded form. The padding is done by

    // copyDistributedVectorToPaddedMemoryStorageVectorDevice

    dftfe::utils::MemoryStorage<ValueType, memorySpace>

      d_sphericalFnTimesVectorDevice;

    // Data structures moved from KSOperatorDevice

    std::vector<ValueType> d_cellHamiltonianMatrixNonLocalFlattenedConjugate;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

      d_cellHamiltonianMatrixNonLocalFlattenedConjugateDevice;

    std::vector<ValueType> d_cellHamiltonianMatrixNonLocalFlattenedTranspose;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

      d_cellHamiltonianMatrixNonLocalFlattenedTransposeDevice;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

      d_cellHamMatrixTimesWaveMatrixNonLocalDevice;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

                           d_sphericalFnTimesVectorAllCellsDevice;

    std::vector<ValueType> d_sphericalFnTimesVectorAllCellsReduction;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

      d_sphericalFnTimesVectorAllCellsReductionDevice;


    std::vector<dftfe::uInt> d_mapSphericalFnTimesVectorAllCellsReduction;

    dftfe::utils::MemoryStorage<dftfe::uInt, dftfe::utils::MemorySpace::DEVICE>

      d_mapSphericalFnTimesVectorAllCellsReductionDevice;

    dftfe::utils::MemoryStorage<ValueType, dftfe::utils::MemorySpace::DEVICE>

      d_couplingMatrixTimesVectorDevice;


    // Host-side index maps (std::vector), each followed by its DEVICE

    // MemoryStorage counterpart carrying the "Device" suffix

    std::vector<dftfe::uInt> d_sphericalFnIdsParallelNumberingMap;

    std::vector<dftfe::Int>  d_sphericalFnIdsPaddedParallelNumberingMap;

    dftfe::utils::MemoryStorage<dftfe::uInt, dftfe::utils::MemorySpace::DEVICE>

      d_sphericalFnIdsParallelNumberingMapDevice;

    dftfe::utils::MemoryStorage<dftfe::Int, dftfe::utils::MemorySpace::DEVICE>

      d_sphericalFnIdsPaddedParallelNumberingMapDevice;

    std::vector<dftfe::Int>

      d_indexMapFromPaddedNonLocalVecToParallelNonLocalVec;

    dftfe::utils::MemoryStorage<dftfe::Int, dftfe::utils::MemorySpace::DEVICE>

      d_indexMapFromPaddedNonLocalVecToParallelNonLocalVecDevice;

    std::vector<dftfe::uInt> d_cellNodeIdMapNonLocalToLocal;


    dftfe::utils::MemoryStorage<dftfe::uInt, dftfe::utils::MemorySpace::DEVICE>

      d_cellNodeIdMapNonLocalToLocalDevice;

#endif

  };


} // namespace dftfe

#endif // DFTFE_ATOMICCENTEREDNONLOCALOPERATOR_H

AtomCenteredSphericalFunctionContainer.h

BLASWrapper.h

DeviceTypeConfig.h

FEBasisOperations.h

MPIPatternP2P.h

MemorySpaceType.h

MultiVector.h

dftfe::AtomicCenteredNonLocalOperator::computeCMatrixEntries
void computeCMatrixEntries(std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, dftfe::utils::MemorySpace::HOST > > basisOperationsPtr, const dftfe::uInt quadratureIndex)
computes the entries in C matrix for CPUs and GPUs. On GPUs the entries are copied to a flattened vec...

dftfe::AtomicCenteredNonLocalOperator::atomPresentInCellRange
bool atomPresentInCellRange(const std::pair< dftfe::uInt, dftfe::uInt > cellRange) const

dftfe::AtomicCenteredNonLocalOperator::initKpoints
void initKpoints(const std::vector< double > &kPointWeights, const std::vector< double > &kPointCoordinates)
stores the d_kpointWeights, d_kpointCoordinates. Other data members regarding are computed from conta...

dftfe::AtomicCenteredNonLocalOperator::d_atomCenteredKpointIndexedSphericalFnQuadValues
std::vector< ValueType > d_atomCenteredKpointIndexedSphericalFnQuadValues
Definition AtomicCenteredNonLocalOperator.h:511

dftfe::AtomicCenteredNonLocalOperator::applyVCconjtransOnX
void applyVCconjtransOnX(const dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &src, const dftfe::uInt kPointIndex, const CouplingStructure couplingtype, const dftfe::utils::MemoryStorage< ValueType, memorySpace > &couplingMatrix, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, const bool flagScaleInternalMatrix=false)
completes the VCconjX on nodal vector src. The src vector must have all ghost nodes and constraint no...

dftfe::AtomicCenteredNonLocalOperator::AtomicCenteredNonLocalOperator
AtomicCenteredNonLocalOperator(std::shared_ptr< dftfe::linearAlgebra::BLASWrapper< memorySpace > > BLASWrapperPtr, std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, memorySpace > > basisOperatorPtr, std::shared_ptr< AtomCenteredSphericalFunctionContainer > atomCenteredSphericalFunctionContainer, const MPI_Comm &mpi_comm_parent, const bool memOptMode=false, const bool computeSphericalFnTimesX=true, const bool useGlobalCMatrix=false)

dftfe::AtomicCenteredNonLocalOperator::d_mapiAtomToDotProd
std::vector< dftfe::uInt > d_mapiAtomToDotProd
Definition AtomicCenteredNonLocalOperator.h:674

dftfe::AtomicCenteredNonLocalOperator::d_totalNumSphericalFunctionsGlobal
dftfe::uInt d_totalNumSphericalFunctionsGlobal
Definition AtomicCenteredNonLocalOperator.h:662

dftfe::AtomicCenteredNonLocalOperator::d_locallyOwnedAtomCenteredFnIdsCurrentProcess
dealii::IndexSet d_locallyOwnedAtomCenteredFnIdsCurrentProcess
Definition AtomicCenteredNonLocalOperator.h:551

dftfe::AtomicCenteredNonLocalOperator::d_atomIdToNonTrivialSphericalFnCellStartIndex
std::map< dftfe::uInt, std::vector< dftfe::uInt > > d_atomIdToNonTrivialSphericalFnCellStartIndex
map from local nonlocal atomid to vector over cells
Definition AtomicCenteredNonLocalOperator.h:531

dftfe::AtomicCenteredNonLocalOperator::getTotalAtomInCurrentProcessor
dftfe::uInt getTotalAtomInCurrentProcessor() const

dftfe::AtomicCenteredNonLocalOperator::d_dotProductAtomicWaveInputWaveTemp
std::vector< dftfe::utils::MemoryStorage< ValueType, memorySpace > > d_dotProductAtomicWaveInputWaveTemp
Definition AtomicCenteredNonLocalOperator.h:672

dftfe::AtomicCenteredNonLocalOperator::getSphericalFnTimesVectorFlattenedVectorLocalIds
const std::vector< dftfe::uInt > & getSphericalFnTimesVectorFlattenedVectorLocalIds() const
Returns the Flattened vector of sphericalFunctionIDs in order of atomIDs of atoms in processor.

dftfe::AtomicCenteredNonLocalOperator::d_useGlobalCMatrix
bool d_useGlobalCMatrix
Definition AtomicCenteredNonLocalOperator.h:660

dftfe::AtomicCenteredNonLocalOperator::getCmatrixEntriesConjugate
const std::vector< ValueType > & getCmatrixEntriesConjugate(const dftfe::uInt chargeId, const dftfe::uInt iElemComp) const
Returns C matrix entries for chargeId and its compact support element Id.

dftfe::AtomicCenteredNonLocalOperator::d_kPointWeights
std::vector< double > d_kPointWeights
Definition AtomicCenteredNonLocalOperator.h:494

dftfe::AtomicCenteredNonLocalOperator::d_n_mpi_processes
const dftfe::uInt d_n_mpi_processes
Definition AtomicCenteredNonLocalOperator.h:561

dftfe::AtomicCenteredNonLocalOperator::getCmatrixEntries
std::vector< ValueType > getCmatrixEntries(dftfe::Int kPointIndex, dftfe::uInt atomId, dftfe::Int iElem) const

dftfe::AtomicCenteredNonLocalOperator::d_AllReduceCompleted
bool d_AllReduceCompleted
Definition AtomicCenteredNonLocalOperator.h:493

dftfe::AtomicCenteredNonLocalOperator::getAtomIdToNonTrivialSphericalFnCellStartIndex
const std::map< dftfe::uInt, std::vector< dftfe::uInt > > & getAtomIdToNonTrivialSphericalFnCellStartIndex() const
Required in configurational forces. Cumulative spherical Fn Id. The size is numCells in processor.

dftfe::AtomicCenteredNonLocalOperator::d_cellIdToAtomIdsLocalCompactSupportMap
std::map< dftfe::uInt, std::vector< dftfe::uInt > > d_cellIdToAtomIdsLocalCompactSupportMap
map from cell number to set of non local atom ids (local numbering)
Definition AtomicCenteredNonLocalOperator.h:518

dftfe::AtomicCenteredNonLocalOperator::d_flattenedNonLocalCellDofIndexToProcessDofIndexVector
std::vector< dftfe::uInt > d_flattenedNonLocalCellDofIndexToProcessDofIndexVector
Definition AtomicCenteredNonLocalOperator.h:655

dftfe::AtomicCenteredNonLocalOperator::copyPartitionerKPointsAndComputeCMatrixEntries
void copyPartitionerKPointsAndComputeCMatrixEntries(const bool updateSparsity, const std::vector< double > &kPointWeights, const std::vector< double > &kPointCoordinates, std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, dftfe::utils::MemorySpace::HOST > > basisOperationsPtr, std::shared_ptr< dftfe::linearAlgebra::BLASWrapper< dftfe::utils::MemorySpace::HOST > > BLASWrapperHostPtr, const dftfe::uInt quadratureIndex, const std::shared_ptr< AtomicCenteredNonLocalOperator< ValueTypeSrc, memorySpace > > nonLocalOperatorSrc)
calls internal function: initialisePartitioner, initialiseKpoint and computeCMatrixEntries

dftfe::AtomicCenteredNonLocalOperator::getAtomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues
const std::vector< ValueType > & getAtomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues() const

dftfe::AtomicCenteredNonLocalOperator::d_AtomCenteredFnIdsNumberingMapCurrentProcess
std::map< std::pair< dftfe::uInt, dftfe::uInt >, dftfe::uInt > d_AtomCenteredFnIdsNumberingMapCurrentProcess
Definition AtomicCenteredNonLocalOperator.h:554

dftfe::AtomicCenteredNonLocalOperator::d_numberWaveFunctions
dftfe::uInt d_numberWaveFunctions
Definition AtomicCenteredNonLocalOperator.h:580

dftfe::AtomicCenteredNonLocalOperator::d_nonlocalElemIdToCellIdVector
std::vector< dftfe::uInt > d_nonlocalElemIdToCellIdVector
Definition AtomicCenteredNonLocalOperator.h:658

dftfe::AtomicCenteredNonLocalOperator::d_mpi_communicator
const MPI_Comm d_mpi_communicator
Definition AtomicCenteredNonLocalOperator.h:559

dftfe::AtomicCenteredNonLocalOperator::d_mapiAtomTosphFuncWaveStart
std::vector< dftfe::uInt > d_mapiAtomTosphFuncWaveStart
Definition AtomicCenteredNonLocalOperator.h:678

dftfe::AtomicCenteredNonLocalOperator::d_locallyOwnedCells
dftfe::uInt d_locallyOwnedCells
Definition AtomicCenteredNonLocalOperator.h:579

dftfe::AtomicCenteredNonLocalOperator::d_listOfiAtomInSpecies
std::map< dftfe::uInt, std::vector< dftfe::uInt > > d_listOfiAtomInSpecies
Definition AtomicCenteredNonLocalOperator.h:679

dftfe::AtomicCenteredNonLocalOperator::d_setOfAtomicNumber
std::set< dftfe::uInt > d_setOfAtomicNumber
Definition AtomicCenteredNonLocalOperator.h:668

dftfe::AtomicCenteredNonLocalOperator::d_iElemNonLocalToElemIndexMap
dftfe::utils::MemoryStorage< dftfe::uInt, memorySpace > d_iElemNonLocalToElemIndexMap
Definition AtomicCenteredNonLocalOperator.h:576

dftfe::AtomicCenteredNonLocalOperator::d_kPointIndex
dftfe::uInt d_kPointIndex
Definition AtomicCenteredNonLocalOperator.h:581

dftfe::AtomicCenteredNonLocalOperator::paddingCouplingMatrix
void paddingCouplingMatrix(const std::vector< ValueType > &entries, std::vector< ValueType > &entriesPadded, const CouplingStructure couplingtype)
Called only for GPU runs where the coupling matrix has to be padded.

dftfe::AtomicCenteredNonLocalOperator::d_maxSingleAtomContribution
dftfe::uInt d_maxSingleAtomContribution
Definition AtomicCenteredNonLocalOperator.h:572

dftfe::AtomicCenteredNonLocalOperator::d_ghostSphericalFunctionIdsCurrentProcess
dealii::IndexSet d_ghostSphericalFunctionIdsCurrentProcess
Definition AtomicCenteredNonLocalOperator.h:563

dftfe::AtomicCenteredNonLocalOperator::d_CMatrixEntriesConjugate
std::vector< std::vector< std::vector< ValueType > > > d_CMatrixEntriesConjugate
Definition AtomicCenteredNonLocalOperator.h:585

dftfe::AtomicCenteredNonLocalOperator::d_nonTrivialSphericalFnsCellStartIndex
std::vector< dftfe::uInt > d_nonTrivialSphericalFnsCellStartIndex
Definition AtomicCenteredNonLocalOperator.h:525

dftfe::AtomicCenteredNonLocalOperator::d_basisOperatorPtr
std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, memorySpace > > d_basisOperatorPtr
Definition AtomicCenteredNonLocalOperator.h:507

dftfe::AtomicCenteredNonLocalOperator::d_CMatrixEntriesTranspose
std::vector< std::vector< std::vector< ValueType > > > d_CMatrixEntriesTranspose
Definition AtomicCenteredNonLocalOperator.h:586

dftfe::AtomicCenteredNonLocalOperator::getNonTrivialAllCellsSphericalFnAlphaToElemIdMap
const std::vector< dftfe::uInt > & getNonTrivialAllCellsSphericalFnAlphaToElemIdMap() const

dftfe::AtomicCenteredNonLocalOperator::d_totalAtomsInCurrentProc
dftfe::uInt d_totalAtomsInCurrentProc
Definition AtomicCenteredNonLocalOperator.h:565

dftfe::AtomicCenteredNonLocalOperator::d_SphericalFunctionKetTimesVectorPar
std::vector< distributedCPUVec< double > > d_SphericalFunctionKetTimesVectorPar
Definition AtomicCenteredNonLocalOperator.h:544

dftfe::AtomicCenteredNonLocalOperator::intitialisePartitionerKPointsAndComputeCMatrixEntries
void intitialisePartitionerKPointsAndComputeCMatrixEntries(const bool updateSparsity, const std::vector< double > &kPointWeights, const std::vector< double > &kPointCoordinates, std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, dftfe::utils::MemorySpace::HOST > > basisOperationsPtr, std::shared_ptr< dftfe::linearAlgebra::BLASWrapper< dftfe::utils::MemorySpace::HOST > > BLASWrapperHostPtr, const dftfe::uInt quadratureIndex)
calls internal function: initialisePartitioner, initialiseKpoint and computeCMatrixEntries

dftfe::AtomicCenteredNonLocalOperator::d_sumNonTrivialSphericalFnOverAllCells
dftfe::uInt d_sumNonTrivialSphericalFnOverAllCells
Definition AtomicCenteredNonLocalOperator.h:533

dftfe::AtomicCenteredNonLocalOperator::d_computeSphericalFnTimesX
bool d_computeSphericalFnTimesX
Definition AtomicCenteredNonLocalOperator.h:659

dftfe::AtomicCenteredNonLocalOperator::d_sphericalFnTimesWavefunMatrix
std::map< dftfe::uInt, dftfe::utils::MemoryStorage< ValueType, dftfe::utils::MemorySpace::HOST > > d_sphericalFnTimesWavefunMatrix
Definition AtomicCenteredNonLocalOperator.h:653

dftfe::AtomicCenteredNonLocalOperator::d_totalLocallyOwnedNodes
dftfe::uInt d_totalLocallyOwnedNodes
Definition AtomicCenteredNonLocalOperator.h:676

dftfe::AtomicCenteredNonLocalOperator::d_CMatrixGlobal
std::vector< std::vector< dftfe::utils::MemoryStorage< ValueType, memorySpace > > > d_CMatrixGlobal
Definition AtomicCenteredNonLocalOperator.h:666

dftfe::AtomicCenteredNonLocalOperator::getOwnedAtomIdsInCurrentProcessor
const std::vector< dftfe::uInt > & getOwnedAtomIdsInCurrentProcessor() const

dftfe::AtomicCenteredNonLocalOperator::getAtomCenteredKpointIndexedSphericalFnQuadValues
const std::vector< ValueType > & getAtomCenteredKpointIndexedSphericalFnQuadValues() const

dftfe::AtomicCenteredNonLocalOperator::d_nonTrivialSphericalFnPerCell
std::vector< dftfe::uInt > d_nonTrivialSphericalFnPerCell
vector of size num physical cells
Definition AtomicCenteredNonLocalOperator.h:521

dftfe::AtomicCenteredNonLocalOperator::d_numberCellsAccumNonLocalAtoms
std::vector< dftfe::uInt > d_numberCellsAccumNonLocalAtoms
Definition AtomicCenteredNonLocalOperator.h:574

dftfe::AtomicCenteredNonLocalOperator::applyAllReduceOnCconjtransX
void applyAllReduceOnCconjtransX(dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, const bool skipComm=false)
copies the results from internal member to sphericalFunctionKetTimesVectorParFlattened,...

dftfe::AtomicCenteredNonLocalOperator::applyCOnVCconjtransX
void applyCOnVCconjtransX(dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &Xout)
adds the result of CVCtX onto Xout for both CPU and GPU calls

dftfe::AtomicCenteredNonLocalOperator::getAtomWiseNumberCellsInCompactSupport
std::vector< dftfe::uInt > & getAtomWiseNumberCellsInCompactSupport() const

dftfe::AtomicCenteredNonLocalOperator::d_BLASWrapperPtr
std::shared_ptr< dftfe::linearAlgebra::BLASWrapper< memorySpace > > d_BLASWrapperPtr
Definition AtomicCenteredNonLocalOperator.h:497

dftfe::AtomicCenteredNonLocalOperator::copyCMatrixEntries
void copyCMatrixEntries(const std::shared_ptr< AtomicCenteredNonLocalOperator< ValueTypeSrc, memorySpace > > nonLocalOperatorSrc, std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, dftfe::utils::MemorySpace::HOST > > basisOperationsPtr, const dftfe::uInt quadratureIndex)

dftfe::AtomicCenteredNonLocalOperator::d_mapiAtomToSpeciesIndex
std::vector< dftfe::uInt > d_mapiAtomToSpeciesIndex
Definition AtomicCenteredNonLocalOperator.h:670

dftfe::AtomicCenteredNonLocalOperator::copyBackFromDistributedVectorToLocalDataStructure
void copyBackFromDistributedVectorToLocalDataStructure(dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, const dftfe::utils::MemoryStorage< double, memorySpace > &scalingVector)
After AllReduce function is called this will copy to the nonLocalOperatorClassDatastructure.

dftfe::AtomicCenteredNonLocalOperator::getGlobalDofAtomIdSphericalFnPair
dftfe::uInt getGlobalDofAtomIdSphericalFnPair(const dftfe::uInt atomId, const dftfe::uInt alpha) const

dftfe::AtomicCenteredNonLocalOperator::applyVCconjtransOnXCellLevel
void applyVCconjtransOnXCellLevel(const dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &src, const dftfe::uInt kPointIndex, const CouplingStructure couplingtype, const dftfe::utils::MemoryStorage< ValueType, memorySpace > &couplingMatrix, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, const bool flagScaleInternalMatrix=false)
completes the VCconjX on nodal vector src. The src vector must have all ghost nodes and constraint no...

dftfe::AtomicCenteredNonLocalOperator::d_numberCellsForEachAtom
std::vector< dftfe::uInt > d_numberCellsForEachAtom
Definition AtomicCenteredNonLocalOperator.h:503

dftfe::AtomicCenteredNonLocalOperator::d_atomCenteredSphericalFunctionContainer
std::shared_ptr< AtomCenteredSphericalFunctionContainer > d_atomCenteredSphericalFunctionContainer
Definition AtomicCenteredNonLocalOperator.h:499

dftfe::AtomicCenteredNonLocalOperator::initialisePartitioner
void initialisePartitioner()
creates the partitioner for the distributed vector based on sparsity pattern from sphericalFn containe...

dftfe::AtomicCenteredNonLocalOperator::d_atomStartIndexGlobal
std::vector< dftfe::uInt > d_atomStartIndexGlobal
Definition AtomicCenteredNonLocalOperator.h:661

dftfe::AtomicCenteredNonLocalOperator::atomSupportInElement
bool atomSupportInElement(dftfe::uInt iElem) const

dftfe::AtomicCenteredNonLocalOperator::d_sphericalFnTimesVectorFlattenedVectorLocalIds
std::vector< dftfe::uInt > d_sphericalFnTimesVectorFlattenedVectorLocalIds
Definition AtomicCenteredNonLocalOperator.h:535

dftfe::AtomicCenteredNonLocalOperator::d_mapAtomIdToSpeciesIndex
std::vector< dftfe::uInt > d_mapAtomIdToSpeciesIndex
Definition AtomicCenteredNonLocalOperator.h:669

dftfe::AtomicCenteredNonLocalOperator::getNonTrivialSphericalFnsCellStartIndex
const std::vector< dftfe::uInt > & getNonTrivialSphericalFnsCellStartIndex() const

dftfe::AtomicCenteredNonLocalOperator::getFlattenedNonLocalCellDofIndexToProcessDofIndexMap
const dftfe::utils::MemoryStorage< dftfe::uInt, memorySpace > & getFlattenedNonLocalCellDofIndexToProcessDofIndexMap() const

dftfe::AtomicCenteredNonLocalOperator::d_CMatrixEntries
std::vector< std::vector< std::vector< dftfe::utils::MemoryStorage< ValueType, memorySpace > > > > d_CMatrixEntries
Definition AtomicCenteredNonLocalOperator.h:557

dftfe::AtomicCenteredNonLocalOperator::getNonlocalElementToCellIdVector
const std::vector< dftfe::uInt > & getNonlocalElementToCellIdVector() const

dftfe::AtomicCenteredNonLocalOperator::d_flattenedNonLocalCellDofIndexToProcessDofIndexMap
dftfe::utils::MemoryStorage< dftfe::uInt, memorySpace > d_flattenedNonLocalCellDofIndexToProcessDofIndexMap
Definition AtomicCenteredNonLocalOperator.h:657

dftfe::AtomicCenteredNonLocalOperator::applyCconjtransOnX
void applyCconjtransOnX(const dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &X)
computes the results of CconjtransX on nodal X vector

dftfe::AtomicCenteredNonLocalOperator::d_numberNodesPerElement
dftfe::uInt d_numberNodesPerElement
Definition AtomicCenteredNonLocalOperator.h:577

dftfe::AtomicCenteredNonLocalOperator::d_isMallocCalled
bool d_isMallocCalled
Definition AtomicCenteredNonLocalOperator.h:583

dftfe::AtomicCenteredNonLocalOperator::d_mpiPatternP2P
std::shared_ptr< const utils::mpi::MPIPatternP2P< dftfe::utils::MemorySpace::HOST > > d_mpiPatternP2P
Definition AtomicCenteredNonLocalOperator.h:502

dftfe::AtomicCenteredNonLocalOperator::applyCconjtransOnX
void applyCconjtransOnX(const ValueType *X, const std::pair< dftfe::uInt, dftfe::uInt > cellRange)
computes the results of CconjtransX on the cells of interest specified by cellRange

dftfe::AtomicCenteredNonLocalOperator::getAtomWiseNumberCellsAccumulated
std::vector< dftfe::uInt > & getAtomWiseNumberCellsAccumulated() const

dftfe::AtomicCenteredNonLocalOperator::d_totalNonLocalEntries
dftfe::uInt d_totalNonLocalEntries
Definition AtomicCenteredNonLocalOperator.h:570

dftfe::AtomicCenteredNonLocalOperator::initialiseOperatorActionOnX
void initialiseOperatorActionOnX(dftfe::uInt kPointIndex)
Resizes various internal data members and selects the kpoint of interest.

dftfe::AtomicCenteredNonLocalOperator::pcout
dealii::ConditionalOStream pcout
Definition AtomicCenteredNonLocalOperator.h:558

dftfe::AtomicCenteredNonLocalOperator::initialiseFlattenedDataStructure
void initialiseFlattenedDataStructure(dftfe::uInt waveFunctionBlockSize, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened)
initialises the multivector object, waveFunctionBlockSize and resizes various internal data members.

dftfe::AtomicCenteredNonLocalOperator::applyCOnVCconjtransX
void applyCOnVCconjtransX(ValueType *Xout, const std::pair< dftfe::uInt, dftfe::uInt > cellRange)
adds the result of CVCtX onto Xout for both CPU and GPU calls

dftfe::AtomicCenteredNonLocalOperator::d_mapIAtomicNumToDotProd
std::vector< dftfe::uInt > d_mapIAtomicNumToDotProd
Definition AtomicCenteredNonLocalOperator.h:673

dftfe::AtomicCenteredNonLocalOperator::applyCVCconjtransOnX
void applyCVCconjtransOnX(const dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &src, const dftfe::uInt kPointIndex, const CouplingStructure couplingtype, const dftfe::utils::MemoryStorage< ValueType, memorySpace > &couplingMatrix, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &dst)
completes the action of CVCconjtranspose on nodal vector src. The src vector must have all ghost node...

dftfe::AtomicCenteredNonLocalOperator::getCellIdToAtomIdsLocalCompactSupportMap
const std::map< dftfe::uInt, std::vector< dftfe::uInt > > & getCellIdToAtomIdsLocalCompactSupportMap() const

dftfe::AtomicCenteredNonLocalOperator::applyVCconjtransOnXUsingGlobalC
void applyVCconjtransOnXUsingGlobalC(const dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &src, const dftfe::uInt kPointIndex, const CouplingStructure couplingtype, const dftfe::utils::MemoryStorage< ValueType, memorySpace > &couplingMatrix, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, const bool flagScaleInternalMatrix=false)
completes the VCconjX on nodal vector src using global C matrix. The global C matrix must have been c...

dftfe::AtomicCenteredNonLocalOperator::getCconjtansXLocalDataStructure
const ValueType * getCconjtansXLocalDataStructure(const dftfe::uInt iAtom) const
Returns the pointer of CTX stored in HOST memory.

dftfe::AtomicCenteredNonLocalOperator::getTotalNonTrivialSphericalFnsOverAllCells
const dftfe::uInt getTotalNonTrivialSphericalFnsOverAllCells() const

dftfe::AtomicCenteredNonLocalOperator::applyVOnCconjtransX
void applyVOnCconjtransX(const CouplingStructure couplingtype, const dftfe::utils::MemoryStorage< ValueType, memorySpace > &couplingMatrix, dftfe::linearAlgebra::MultiVector< ValueType, memorySpace > &sphericalFunctionKetTimesVectorParFlattened, const bool flagCopyResultsToMatrix=true, const dftfe::uInt kPointIndex=0)
compute the action of coupling matrix on sphericalFunctionKetTimesVectorParFlattened.

dftfe::AtomicCenteredNonLocalOperator::getNonTrivialSphericalFnsPerCell
const std::vector< dftfe::uInt > & getNonTrivialSphericalFnsPerCell() const

dftfe::AtomicCenteredNonLocalOperator::d_sphericalFunctionIdsNumberingMapCurrentProcess
std::map< std::pair< dftfe::uInt, dftfe::uInt >, dftfe::uInt > d_sphericalFunctionIdsNumberingMapCurrentProcess
Definition AtomicCenteredNonLocalOperator.h:548

dftfe::AtomicCenteredNonLocalOperator::d_OwnedAtomIdsInCurrentProcessor
std::vector< dftfe::uInt > d_OwnedAtomIdsInCurrentProcessor
Definition AtomicCenteredNonLocalOperator.h:550

dftfe::AtomicCenteredNonLocalOperator::d_nonTrivialAllCellsSphericalFnAlphaToElemIdMap
std::vector< dftfe::uInt > d_nonTrivialAllCellsSphericalFnAlphaToElemIdMap
Definition AtomicCenteredNonLocalOperator.h:527

dftfe::AtomicCenteredNonLocalOperator::d_kPointCoordinates
std::vector< double > d_kPointCoordinates
Definition AtomicCenteredNonLocalOperator.h:495

dftfe::AtomicCenteredNonLocalOperator::getMaxSingleAtomEntries
dftfe::uInt getMaxSingleAtomEntries() const

dftfe::AtomicCenteredNonLocalOperator::d_memoryOptMode
bool d_memoryOptMode
Definition AtomicCenteredNonLocalOperator.h:582

dftfe::AtomicCenteredNonLocalOperator::getGlobalCMatrix
const std::vector< std::vector< dftfe::utils::MemoryStorage< ValueType, memorySpace > > > & getGlobalCMatrix() const
Returns global C matrix of all atoms.

dftfe::AtomicCenteredNonLocalOperator::copyGlobalCMatrix
void copyGlobalCMatrix(const std::shared_ptr< AtomicCenteredNonLocalOperator< ValueTypeSrc, memorySpace > > nonLocalOperatorSrc, std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, dftfe::utils::MemorySpace::HOST > > basisOperationsPtr, const dftfe::uInt quadratureIndex)

dftfe::AtomicCenteredNonLocalOperator::getLocalIdOfDistributedVec
dftfe::uInt getLocalIdOfDistributedVec(const dftfe::uInt globalId) const

dftfe::AtomicCenteredNonLocalOperator::getCmatrixEntriesTranspose
const std::vector< ValueType > & getCmatrixEntriesTranspose(const dftfe::uInt chargeId, const dftfe::uInt iElemComp) const
Returns C conj matrix entries for chargeId and its compact support element Id.

dftfe::AtomicCenteredNonLocalOperator::d_this_mpi_process
const dftfe::uInt d_this_mpi_process
Definition AtomicCenteredNonLocalOperator.h:560

dftfe::AtomicCenteredNonLocalOperator::getTotalNonLocalEntriesCurrentProcessor
dftfe::uInt getTotalNonLocalEntriesCurrentProcessor() const

dftfe::AtomicCenteredNonLocalOperator::computeGlobalCMatrixVector
void computeGlobalCMatrixVector(std::shared_ptr< dftfe::basis::FEBasisOperations< dataTypes::number, double, dftfe::utils::MemorySpace::HOST > > basisOperationsPtr, std::shared_ptr< dftfe::linearAlgebra::BLASWrapper< dftfe::utils::MemorySpace::HOST > > BLASWrapperHostPtr)
computes Global Cmatrix on HOST.

dftfe::AtomicCenteredNonLocalOperator::d_locallyOwnedSphericalFunctionIdsCurrentProcess
dealii::IndexSet d_locallyOwnedSphericalFunctionIdsCurrentProcess
Definition AtomicCenteredNonLocalOperator.h:562

dftfe::AtomicCenteredNonLocalOperator::computeCconjtransCMatrix
void computeCconjtransCMatrix(const dftfe::uInt atomId, std::shared_ptr< dftfe::linearAlgebra::BLASWrapper< dftfe::utils::MemorySpace::HOST > > BLASWrapperPtr, const dftfe::utils::MemoryStorage< double, dftfe::utils::MemorySpace::HOST > &Dinverse, dftfe::utils::MemoryStorage< ValueType, dftfe::utils::MemorySpace::HOST > PconjtransposePmatrix)
Computes C^{T}D^{-1}C at the global level for atomId. This is required in PAW.

dftfe::AtomicCenteredNonLocalOperator::getTotalNonLocalElementsInCurrentProcessor
dftfe::uInt getTotalNonLocalElementsInCurrentProcessor() const

dftfe::AtomicCenteredNonLocalOperator::getNonLocalElemIdToLocalElemIdMap
std::vector< dftfe::uInt > & getNonLocalElemIdToLocalElemIdMap() const

dftfe::AtomicCenteredNonLocalOperator::d_atomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues
std::vector< ValueType > d_atomCenteredKpointTimesSphericalFnTimesDistFromAtomQuadValues
Definition AtomicCenteredNonLocalOperator.h:514

dftfe::AtomicCenteredNonLocalOperator::d_ghostAtomCenteredFnIdsCurrentProcess
dealii::IndexSet d_ghostAtomCenteredFnIdsCurrentProcess
Definition AtomicCenteredNonLocalOperator.h:552

dftfe::AtomicCenteredNonLocalOperator::d_totalNonlocalElems
dftfe::uInt d_totalNonlocalElems
Definition AtomicCenteredNonLocalOperator.h:568

dftfe::basis::FEBasisOperations
Definition FEBasisOperations.h:85

dftfe::linearAlgebra::BLASWrapper
Definition BLASWrapper.h:35

dftfe::linearAlgebra::MultiVector
A class template to encapsulate a MultiVector. A MultiVector is a collection of vectors belonging t...
Definition MultiVector.h:127

dftfe::utils::MemoryStorage
Definition MemoryStorage.h:33

dftfe::utils::mpi::MPIPatternP2P
A class template to store the communication pattern (i.e., which entries/nodes to receive from which ...
Definition MPIPatternP2P.h:57

dftUtils.h

headers.h

linearAlgebraOperations.h

dftfe::dataTypes::number
double number
Definition dftfeDataTypes.h:42

dftfe::utils::MemorySpace::HOST
@ HOST
Definition MemorySpaceType.h:34

dftfe
Definition pseudoPotentialToDftfeConverter.cc:34

dftfe::CouplingStructure
CouplingStructure
Enum class that lists the coupling structures used in the non-local Operator.
Definition AtomicCenteredNonLocalOperator.h:48

dftfe::CouplingStructure::dense
@ dense
Definition AtomicCenteredNonLocalOperator.h:50

dftfe::CouplingStructure::blockDiagonal
@ blockDiagonal
Definition AtomicCenteredNonLocalOperator.h:51

dftfe::CouplingStructure::diagonal
@ diagonal
Definition AtomicCenteredNonLocalOperator.h:49

dftfe::uInt
std::uint32_t uInt
Definition TypeConfig.h:10

dftfe::Int
std::int32_t Int
Definition TypeConfig.h:11

pseudoUtils.h

sphericalHarmonicUtils.h

vectorUtilities.h