Scalapack wrapper adapted from dealii library and extended implementation to complex datatype. More...

#include <scalapackWrapper.h>

Public Types
using	size_type = unsigned int

Public Member Functions
	ScaLAPACKMatrix (const size_type n_rows, const size_type n_columns, const std::shared_ptr< const dftfe::ProcessGrid > &process_grid, const size_type row_block_size=32, const size_type column_block_size=32, const dftfe::LAPACKSupport::Property property=dftfe::LAPACKSupport::Property::general)

	ScaLAPACKMatrix (const size_type size, const std::shared_ptr< const dftfe::ProcessGrid > &process_grid, const size_type block_size=32, const dftfe::LAPACKSupport::Property property=dftfe::LAPACKSupport::Property::hermitian)

void	reinit (const size_type n_rows, const size_type n_columns, const std::shared_ptr< const dftfe::ProcessGrid > &process_grid, const size_type row_block_size=32, const size_type column_block_size=32, const dftfe::LAPACKSupport::Property property=dftfe::LAPACKSupport::Property::general)

void	reinit (const size_type size, const std::shared_ptr< const dftfe::ProcessGrid > &process_grid, const size_type block_size=32, const dftfe::LAPACKSupport::Property property=dftfe::LAPACKSupport::Property::hermitian)

void	set_property (const dftfe::LAPACKSupport::Property property)

dftfe::LAPACKSupport::Property	get_property () const

dftfe::LAPACKSupport::State	get_state () const

void	copy_to (ScaLAPACKMatrix< NumberType > &dest) const

void	conjugate ()

void	add (const ScaLAPACKMatrix< NumberType > &B, const NumberType a=0., const NumberType b=1., const bool transpose_B=false)

void	zadd (const ScaLAPACKMatrix< NumberType > &B, const NumberType a=0., const NumberType b=1., const bool conjugate_transpose_B=false)

void	copy_transposed (const ScaLAPACKMatrix< NumberType > &B)

void	copy_conjugate_transposed (const ScaLAPACKMatrix< NumberType > &B)

void	mult (const NumberType b, const ScaLAPACKMatrix< NumberType > &B, const NumberType c, ScaLAPACKMatrix< NumberType > &C, const bool transpose_A=false, const bool transpose_B=false) const

void	zmult (const NumberType b, const ScaLAPACKMatrix< NumberType > &B, const NumberType c, ScaLAPACKMatrix< NumberType > &C, const bool conjugate_transpose_A=false, const bool conjugate_transpose_B=false) const

void	mmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	Tmmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	mTmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	TmTmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	zmmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	zCmmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	zmCmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

void	zCmCmult (ScaLAPACKMatrix< NumberType > &C, const ScaLAPACKMatrix< NumberType > &B, const bool adding=false) const

size_type	m () const

size_type	n () const

unsigned int	local_m () const

unsigned int	local_n () const

unsigned int	global_row (const unsigned int loc_row) const

unsigned int	global_column (const unsigned int loc_column) const

NumberType	local_el (const unsigned int loc_row, const unsigned int loc_column) const

NumberType &	local_el (const unsigned int loc_row, const unsigned int loc_column)

void	compute_cholesky_factorization ()

void	compute_lu_factorization ()

void	invert ()

void	scale_columns (const std::vector< NumberType > &factors)

void	scale_rows (const std::vector< NumberType > &factors)

void	scale_columns_realfactors (const std::vector< double > &factors)

void	scale_rows_realfactors (const std::vector< double > &factors)

std::vector< double >	eigenpairs_hermitian_by_index (const std::pair< unsigned int, unsigned int > &index_limits, const bool compute_eigenvectors)

std::vector< double >	eigenpairs_hermitian_by_index_MRRR (const std::pair< unsigned int, unsigned int > &index_limits, const bool compute_eigenvectors)

Private Member Functions
std::vector< double >	eigenpairs_hermitian (const bool compute_eigenvectors, const std::pair< unsigned int, unsigned int > &index_limits=std::make_pair(dealii::numbers::invalid_unsigned_int, dealii::numbers::invalid_unsigned_int), const std::pair< double, double > &value_limits=std::make_pair(std::numeric_limits< double >::quiet_NaN(), std::numeric_limits< double >::quiet_NaN()))

std::vector< double >	eigenpairs_hermitian_MRRR (const bool compute_eigenvectors, const std::pair< unsigned int, unsigned int > &index_limits=std::make_pair(dealii::numbers::invalid_unsigned_int, dealii::numbers::invalid_unsigned_int), const std::pair< double, double > &value_limits=std::make_pair(std::numeric_limits< double >::quiet_NaN(), std::numeric_limits< double >::quiet_NaN()))

Private Attributes
std::vector< NumberType >	values

dftfe::LAPACKSupport::State	state

dftfe::LAPACKSupport::Property	property

std::shared_ptr< const dftfe::ProcessGrid >	grid

int	n_rows

int	n_columns

int	row_block_size

int	column_block_size

int	n_local_rows

int	n_local_columns

int	descriptor [9]

std::vector< NumberType >	work

std::vector< int >	iwork

std::vector< int >	ipiv

const char	uplo

const int	first_process_row

const int	first_process_column

const int	submatrix_row

const int	submatrix_column

dealii::Threads::Mutex	mutex

Detailed Description

template<typename NumberType>
class dftfe::ScaLAPACKMatrix< NumberType >

Scalapack wrapper adapted from dealii library and extended implementation to complex datatype.

Author: Sambit Das

Member Typedef Documentation

◆ size_type

template<typename NumberType>

using dftfe::ScaLAPACKMatrix< NumberType >::size_type = unsigned int

Declare the type for container size.

Constructor & Destructor Documentation

◆ ScaLAPACKMatrix() [1/2]

template<typename NumberType>

dftfe::ScaLAPACKMatrix< NumberType >::ScaLAPACKMatrix	(	const size_type	n_rows,
		const size_type	n_columns,
		const std::shared_ptr< const dftfe::ProcessGrid > &	process_grid,
		const size_type	row_block_size = 32,
		const size_type	column_block_size = 32,
		const dftfe::LAPACKSupport::Property	property = dftfe::LAPACKSupport::Property::general )

Constructor for a rectangular matrix with n_rows and n_cols and distributed using the grid process_grid.

The parameters row_block_size and column_block_size are the block sizes used for the block-cyclic distribution of the matrix. In general, it is recommended to use powers of $2$, e.g. $16,32,64, \dots$.

◆ ScaLAPACKMatrix() [2/2]

template<typename NumberType>

dftfe::ScaLAPACKMatrix< NumberType >::ScaLAPACKMatrix	(	const size_type	size,
		const std::shared_ptr< const dftfe::ProcessGrid > &	process_grid,
		const size_type	block_size = 32,
		const dftfe::LAPACKSupport::Property	property = dftfe::LAPACKSupport::Property::hermitian )

Constructor for a square matrix of size size, and distributed using the process grid in process_grid.

The parameter block_size is used for the block-cyclic distribution of the matrix. An identical block size is used for the rows and columns of the matrix. In general, it is recommended to use powers of $2$, e.g. $16,32,64, \dots$.

Member Function Documentation

◆ add()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::add	(	const ScaLAPACKMatrix< NumberType > &	B,
		const NumberType	a = 0.,
		const NumberType	b = 1.,
		const bool	transpose_B = false )

The operations based on the input parameter transpose_B and the alignment conditions are summarized in the following table:

transpose_B	Block Sizes	Operation
false	$MB_A=MB_B$ $NB_A=NB_B$	$\mathbf{A} = a \mathbf{A} + b \mathbf{B}$
true	$MB_A=NB_B$ $NB_A=MB_B$	$\mathbf{A} = a \mathbf{A} + b \mathbf{B}^T$

The matrices $\mathbf{A}$ and $\mathbf{B}$ must have the same process grid.

◆ compute_cholesky_factorization()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::compute_cholesky_factorization ( )

Compute the Cholesky factorization of the matrix using ScaLAPACK function pXpotrf. The result of the factorization is stored in this object.

◆ compute_lu_factorization()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::compute_lu_factorization ( )

Compute the LU factorization of the matrix using ScaLAPACK function pXgetrf and partial pivoting with row interchanges. The result of the factorization is stored in this object.

◆ conjugate()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::conjugate ( )

Complex conjugate.

◆ copy_conjugate_transposed()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::copy_conjugate_transposed ( const ScaLAPACKMatrix< NumberType > & B )

Transposing assignment: $\mathbf{A} = \mathbf{B}^C$

The matrices $\mathbf{A}$ and $\mathbf{B}$ must have the same process grid.

The following alignment conditions have to be fulfilled: $MB_A=NB_B$ and $NB_A=MB_B$.

◆ copy_to()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::copy_to ( ScaLAPACKMatrix< NumberType > & dest ) const

Copy the contents of the distributed matrix into a differently distributed matrix dest. The function also works for matrices with different process grids or block-cyclic distributions.

◆ copy_transposed()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::copy_transposed ( const ScaLAPACKMatrix< NumberType > & B )

Transposing assignment: $\mathbf{A} = \mathbf{B}^T$

The matrices $\mathbf{A}$ and $\mathbf{B}$ must have the same process grid.

The following alignment conditions have to be fulfilled: $MB_A=NB_B$ and $NB_A=MB_B$.

◆ eigenpairs_hermitian()

template<typename NumberType>

std::vector< double > dftfe::ScaLAPACKMatrix< NumberType >::eigenpairs_hermitian	(	const bool	compute_eigenvectors,
		const std::pair< unsigned int, unsigned int > &	index_limits = std::make_pair(dealii::numbers::invalid_unsigned_int, dealii::numbers::invalid_unsigned_int),
		const std::pair< double, double > &	value_limits = std::make_pair(std::numeric_limits< double >::quiet_NaN(), std::numeric_limits< double >::quiet_NaN()) )

private

Computing selected eigenvalues and, optionally, the eigenvectors. The eigenvalues/eigenvectors are selected by either prescribing a range of indices index_limits or a range of values value_limits for the eigenvalues. The function will throw an exception if both ranges are prescribed (meaning that both ranges differ from the default value) as this ambiguity is prohibited. If successful, the computed eigenvalues are arranged in ascending order. The eigenvectors are stored in the columns of the matrix, thereby overwriting the original content of the matrix.

◆ eigenpairs_hermitian_by_index()

template<typename NumberType>

std::vector< double > dftfe::ScaLAPACKMatrix< NumberType >::eigenpairs_hermitian_by_index	(	const std::pair< unsigned int, unsigned int > &	index_limits,
		const bool	compute_eigenvectors )

Computing selected eigenvalues and, optionally, the eigenvectors of the real hermitian matrix $\mathbf{A} \in \mathbb{R}^{M \times M}$.

The eigenvalues/eigenvectors are selected by prescribing a range of indices index_limits.

If successful, the computed eigenvalues are arranged in ascending order. The eigenvectors are stored in the columns of the matrix, thereby overwriting the original content of the matrix.

If all eigenvalues/eigenvectors have to be computed, pass the closed interval $ \left[ 0, M-1 \right] $ in index_limits.

Pass the closed interval $ \left[ M-r, M-1 \right] $ if the $r$ largest eigenvalues/eigenvectors are desired.

◆ eigenpairs_hermitian_by_index_MRRR()

template<typename NumberType>

std::vector< double > dftfe::ScaLAPACKMatrix< NumberType >::eigenpairs_hermitian_by_index_MRRR	(	const std::pair< unsigned int, unsigned int > &	index_limits,
		const bool	compute_eigenvectors )

Computing selected eigenvalues and, optionally, the eigenvectors of the real hermitian matrix $\mathbf{A} \in \mathbb{R}^{M \times M}$ using the MRRR algorithm.

The eigenvalues/eigenvectors are selected by prescribing a range of indices index_limits.

If successful, the computed eigenvalues are arranged in ascending order. The eigenvectors are stored in the columns of the matrix, thereby overwriting the original content of the matrix.

If all eigenvalues/eigenvectors have to be computed, pass the closed interval $ \left[ 0, M-1 \right] $ in index_limits.

Pass the closed interval $ \left[ M-r, M-1 \right] $ if the $r$ largest eigenvalues/eigenvectors are desired.

◆ eigenpairs_hermitian_MRRR()

template<typename NumberType>

std::vector< double > dftfe::ScaLAPACKMatrix< NumberType >::eigenpairs_hermitian_MRRR	(	const bool	compute_eigenvectors,
		const std::pair< unsigned int, unsigned int > &	index_limits = std::make_pair(dealii::numbers::invalid_unsigned_int, dealii::numbers::invalid_unsigned_int),
		const std::pair< double, double > &	value_limits = std::make_pair(std::numeric_limits< double >::quiet_NaN(), std::numeric_limits< double >::quiet_NaN()) )

private

Computing selected eigenvalues and, optionally, the eigenvectors of the real hermitian matrix $\mathbf{A} \in \mathbb{R}^{M \times M}$ using the MRRR algorithm. The eigenvalues/eigenvectors are selected by either prescribing a range of indices index_limits or a range of values value_limits for the eigenvalues. The function will throw an exception if both ranges are prescribed (meaning that both ranges differ from the default value) as this ambiguity is prohibited.

By calling this function the original content of the matrix will be overwritten. If requested, the eigenvectors are stored in the columns of the matrix. Also in the case that just the eigenvalues are required, the content of the matrix will be overwritten.

If successful, the computed eigenvalues are arranged in ascending order.

Note: Due to a bug in Netlib-ScaLAPACK, either all or no eigenvectors can be computed. Therefore, the input index_limits has to be set accordingly. Using Intel-MKL this restriction is not required.

◆ get_property()

template<typename NumberType>

dftfe::LAPACKSupport::Property dftfe::ScaLAPACKMatrix< NumberType >::get_property ( ) const

Return current property of this matrix

◆ get_state()

template<typename NumberType>

dftfe::LAPACKSupport::State dftfe::ScaLAPACKMatrix< NumberType >::get_state ( ) const

Return current state of this matrix

◆ global_column()

template<typename NumberType>

unsigned int dftfe::ScaLAPACKMatrix< NumberType >::global_column ( const unsigned int loc_column ) const

Return the global column number for the given local column loc_column.

◆ global_row()

template<typename NumberType>

unsigned int dftfe::ScaLAPACKMatrix< NumberType >::global_row ( const unsigned int loc_row ) const

Return the global row number for the given local row loc_row .

◆ invert()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::invert ( )

Invert the matrix by first computing a Cholesky for hermitian matrices or a LU factorization for general matrices and then building the actual inverse using pXpotri or pXgetri. If the matrix is triangular, the LU factorization step is skipped, and pXtrtri is used directly.

If a Cholesky or LU factorization has been applied previously, pXpotri or pXgetri are called directly.

The inverse is stored in this object.

◆ local_el() [1/2]

template<typename NumberType>

NumberType & dftfe::ScaLAPACKMatrix< NumberType >::local_el	(	const unsigned int	loc_row,
		const unsigned int	loc_column )

inline

Write access to local element.

◆ local_el() [2/2]

template<typename NumberType>

NumberType dftfe::ScaLAPACKMatrix< NumberType >::local_el	(	const unsigned int	loc_row,
		const unsigned int	loc_column ) const

inline

Read access to local element.

◆ local_m()

template<typename NumberType>

unsigned int dftfe::ScaLAPACKMatrix< NumberType >::local_m ( ) const

Number of local rows on this MPI processes.

◆ local_n()

template<typename NumberType>

unsigned int dftfe::ScaLAPACKMatrix< NumberType >::local_n ( ) const

Number of local columns on this MPI process.

◆ m()

template<typename NumberType>

unsigned int dftfe::ScaLAPACKMatrix< NumberType >::m ( ) const

inline

Number of rows of the $M \times N$ matrix.

◆ mmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::mmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A} \cdot \mathbf{B}$

else $\mathbf{C} = \mathbf{A} \cdot \mathbf{B}$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=MB_C$, $NB_A=MB_B$ and $NB_B=NB_C$.

◆ mTmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::mTmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication using the transpose of $\mathbf{B}$.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A} \cdot \mathbf{B}^T$

else $\mathbf{C} = \mathbf{A} \cdot \mathbf{B}^T$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=MB_C$, $NB_A=NB_B$ and $MB_B=NB_C$.

◆ mult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::mult	(	const NumberType	b,
		const ScaLAPACKMatrix< NumberType > &	B,
		const NumberType	c,
		ScaLAPACKMatrix< NumberType > &	C,
		const bool	transpose_A = false,
		const bool	transpose_B = false ) const

Matrix-matrix-multiplication:

The operations based on the input parameters and the alignment conditions are summarized in the following table:

transpose_A	transpose_B	Block Sizes	Operation
false	false	$MB_A=MB_C$ $NB_A=MB_B$ $NB_B=NB_C$	$\mathbf{C} = b \mathbf{A} \cdot \mathbf{B} + c \mathbf{C}$
false	true	$MB_A=MB_C$ $NB_A=NB_B$ $MB_B=NB_C$	$\mathbf{C} = b \mathbf{A} \cdot \mathbf{B}^T + c \mathbf{C}$
true	false	$MB_A=MB_B$ $NB_A=MB_C$ $NB_B=NB_C$	$\mathbf{C} = b \mathbf{A}^T \cdot \mathbf{B} + c \mathbf{C}$
true	true	$MB_A=NB_B$ $NB_A=MB_C$ $MB_B=NB_C$	$\mathbf{C} = b \mathbf{A}^T \cdot \mathbf{B}^T + c \mathbf{C}$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The matrices $\mathbf{A}$, $\mathbf{B}$ and $\mathbf{C}$ must have the same process grid.

◆ n()

template<typename NumberType>

unsigned int dftfe::ScaLAPACKMatrix< NumberType >::n ( ) const

inline

Number of columns of the $M \times N$ matrix.

◆ reinit() [1/2]

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::reinit	(	const size_type	n_rows,
		const size_type	n_columns,
		const std::shared_ptr< const dftfe::ProcessGrid > &	process_grid,
		const size_type	row_block_size = 32,
		const size_type	column_block_size = 32,
		const dftfe::LAPACKSupport::Property	property = dftfe::LAPACKSupport::Property::general )

Initialize the rectangular matrix with n_rows and n_cols and distributed using the grid process_grid.

The parameters row_block_size and column_block_size are the block sizes used for the block-cyclic distribution of the matrix. In general, it is recommended to use powers of $2$, e.g. $16,32,64, \dots$.

◆ reinit() [2/2]

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::reinit	(	const size_type	size,
		const std::shared_ptr< const dftfe::ProcessGrid > &	process_grid,
		const size_type	block_size = 32,
		const dftfe::LAPACKSupport::Property	property = dftfe::LAPACKSupport::Property::hermitian )

Initialize the square matrix of size size and distributed using the grid process_grid.

The parameter block_size is used for the block-cyclic distribution of the matrix. An identical block size is used for the rows and columns of the matrix. In general, it is recommended to use powers of $2$, e.g. $16,32,64, \dots$.

◆ scale_columns()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::scale_columns ( const std::vector< NumberType > & factors )

Scale the columns of the distributed matrix by the scalars provided in the array factors.

The array factors must have as many entries as the matrix columns.

Copies of factors have to be available on all processes of the underlying MPI communicator.

◆ scale_columns_realfactors()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::scale_columns_realfactors ( const std::vector< double > & factors )

Scale the columns of the distributed matrix by the scalars provided in the array factors.

The array factors must have as many entries as the matrix columns.

Copies of factors have to be available on all processes of the underlying MPI communicator.

◆ scale_rows()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::scale_rows ( const std::vector< NumberType > & factors )

Scale the rows of the distributed matrix by the scalars provided in the array factors.

The array factors must have as many entries as the matrix rows.

Copies of factors have to be available on all processes of the underlying MPI communicator.

◆ scale_rows_realfactors()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::scale_rows_realfactors ( const std::vector< double > & factors )

Scale the rows of the distributed matrix by the scalars provided in the array factors.

The array factors must have as many entries as the matrix rows.

Copies of factors have to be available on all processes of the underlying MPI communicator.

◆ set_property()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::set_property ( const dftfe::LAPACKSupport::Property property )

Assign property to this matrix.

◆ Tmmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::Tmmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication using transpose of $\mathbf{A}$.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A}^T \cdot \mathbf{B}$

else $\mathbf{C} = \mathbf{A}^T \cdot \mathbf{B}$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=MB_B$, $NB_A=MB_C$ and $NB_B=NB_C$.

◆ TmTmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::TmTmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication using transpose of $\mathbf{A}$ and $\mathbf{B}$.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A}^T \cdot \mathbf{B}^T$

else $\mathbf{C} = \mathbf{A}^T \cdot \mathbf{B}^T$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=NB_B$, $NB_A=MB_C$ and $MB_B=NB_C$.

◆ zadd()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::zadd	(	const ScaLAPACKMatrix< NumberType > &	B,
		const NumberType	a = 0.,
		const NumberType	b = 1.,
		const bool	conjugate_transpose_B = false )

The operations based on the input parameter conjugate_transpose_B and the alignment conditions are summarized in the following table:

transpose_B	Block Sizes	Operation
false	$MB_A=MB_B$ $NB_A=NB_B$	$\mathbf{A} = a \mathbf{A} + b \mathbf{B}$
true	$MB_A=NB_B$ $NB_A=MB_B$	$\mathbf{A} = a \mathbf{A} + b \mathbf{B}^C$

The matrices $\mathbf{A}$ and $\mathbf{B}$ must have the same process grid.

◆ zCmCmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::zCmCmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication using conjugate transpose of $\mathbf{A}$ and $\mathbf{B}$.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A}^C \cdot \mathbf{B}^T$

else $\mathbf{C} = \mathbf{A}^C \cdot \mathbf{B}^C$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=NB_B$, $NB_A=MB_C$ and $MB_B=NB_C$.

◆ zCmmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::zCmmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication using conjugate transpose of $\mathbf{A}$.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A}^C \cdot \mathbf{B}$

else $\mathbf{C} = \mathbf{A}^C \cdot \mathbf{B}$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=MB_B$, $NB_A=MB_C$ and $NB_B=NB_C$.

◆ zmCmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::zmCmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication using the conjugate transpose of $\mathbf{B}$.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A} \cdot \mathbf{B}^C$

else $\mathbf{C} = \mathbf{A} \cdot \mathbf{B}^C$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=MB_C$, $NB_A=NB_B$ and $MB_B=NB_C$.

◆ zmmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::zmmult	(	ScaLAPACKMatrix< NumberType > &	C,
		const ScaLAPACKMatrix< NumberType > &	B,
		const bool	adding = false ) const

Matrix-matrix-multiplication.

The optional parameter adding determines whether the result is stored in $\mathbf{C}$ or added to $\mathbf{C}$.

if (adding) $\mathbf{C} = \mathbf{C} + \mathbf{A} \cdot \mathbf{B}$

else $\mathbf{C} = \mathbf{A} \cdot \mathbf{B}$

It is assumed that $\mathbf{A}$ and $\mathbf{B}$ have compatible sizes and that $\mathbf{C}$ already has the right size.

The following alignment conditions have to be fulfilled: $MB_A=MB_C$, $NB_A=MB_B$ and $NB_B=NB_C$.

◆ zmult()

template<typename NumberType>

void dftfe::ScaLAPACKMatrix< NumberType >::zmult	(	const NumberType	b,
		const ScaLAPACKMatrix< NumberType > &	B,
		const NumberType	c,
		ScaLAPACKMatrix< NumberType > &	C,
		const bool	conjugate_transpose_A = false,
		const bool	conjugate_transpose_B = false ) const

Matrix-matrix-multiplication:

The operations based on the input parameters and the alignment conditions are summarized in the following table:

conjugate_transpose_A	conjugate_transpose_B	Block Sizes	Operation
false	false	$MB_A=MB_C$ $NB_A=MB_B$ $NB_B=NB_C$	$\mathbf{C} = b \mathbf{A} \cdot \mathbf{B} + c \mathbf{C}$
false	true	$MB_A=MB_C$ $NB_A=NB_B$ $MB_B=NB_C$	$\mathbf{C} = b \mathbf{A} \cdot \mathbf{B}^C + c \mathbf{C}$
true	false	$MB_A=MB_B$ $NB_A=MB_C$ $NB_B=NB_C$	$\mathbf{C} = b \mathbf{A}^C \cdot \mathbf{B} + c \mathbf{C}$
true	true	$MB_A=NB_B$ $NB_A=MB_C$ $MB_B=NB_C$	$\mathbf{C} = b \mathbf{A}^C \cdot \mathbf{B}^C + c \mathbf{C}$

std::vector<NumberType> dftfe::ScaLAPACKMatrix< NumberType >::work

mutableprivate

Workspace array.

The documentation for this class was generated from the following files:

workspace/include/process_grid.h
workspace/include/scalapackWrapper.h

Public Types

Public Member Functions

Private Member Functions

Private Attributes

Detailed Description

Member Typedef Documentation

◆ size_type

Constructor & Destructor Documentation

◆ ScaLAPACKMatrix() [1/2]

◆ ScaLAPACKMatrix() [2/2]

Member Function Documentation

◆ add()

◆ compute_cholesky_factorization()

◆ compute_lu_factorization()

◆ conjugate()

◆ copy_conjugate_transposed()

◆ copy_to()

◆ copy_transposed()

◆ eigenpairs_hermitian()

◆ eigenpairs_hermitian_by_index()

◆ eigenpairs_hermitian_by_index_MRRR()

◆ eigenpairs_hermitian_MRRR()

◆ get_property()

◆ get_state()

◆ global_column()

◆ global_row()

◆ invert()

◆ local_el() [1/2]

◆ local_el() [2/2]

◆ local_m()

◆ local_n()

◆ m()

◆ mmult()

◆ mTmult()

◆ mult()

◆ n()

◆ reinit() [1/2]

◆ reinit() [2/2]

◆ scale_columns()

◆ scale_columns_realfactors()

◆ scale_rows()

◆ scale_rows_realfactors()

◆ set_property()

◆ Tmmult()

◆ TmTmult()

◆ zadd()

◆ zCmCmult()

◆ zCmmult()

◆ zmCmult()

◆ zmmult()

◆ zmult()

Member Data Documentation

◆ column_block_size

◆ descriptor

◆ first_process_column

◆ first_process_row

◆ grid

◆ ipiv

◆ iwork

◆ mutex

◆ n_columns

◆ n_local_columns

◆ n_local_rows

◆ n_rows

◆ property

◆ row_block_size

◆ state

◆ submatrix_column

◆ submatrix_row

◆ uplo

◆ values

◆ work