diff --git a/master/add_8h_source.html b/master/add_8h_source.html index 8c304045cf..5414c34594 100644 --- a/master/add_8h_source.html +++ b/master/add_8h_source.html @@ -95,30 +95,32 @@
12
13#ifdef DLAF_WITH_GPU
14
-
15#include <blas.hh>
-
16#include <whip.hpp>
-
17
-
18#include <dlaf/gpu/blas/api.h>
-
19#include <dlaf/types.h>
-
20
-
21namespace dlaf::gpulapack {
+
15#include <complex>
+
16
+
17#include <blas.hh>
+
18#include <whip.hpp>
+
19
+
20#include <dlaf/gpu/blas/api.h>
+
21#include <dlaf/types.h>
22
-
23template <class T>
-
24void add(const blas::Uplo uplo, const SizeType m, const SizeType n, const T& alpha, const T* a,
-
25 const SizeType lda, T* b, const SizeType ldb, const whip::stream_t stream);
-
26
-
27#define DLAF_CUBLAS_ADD_ETI(kword, Type) \
-
28 kword template void add(const blas::Uplo uplo, const SizeType m, const SizeType n, const Type& alpha, \
-
29 const Type* a, const SizeType lda, Type* b, const SizeType ldb, \
-
30 const whip::stream_t stream)
-
31
-
32DLAF_CUBLAS_ADD_ETI(extern, float);
-
33DLAF_CUBLAS_ADD_ETI(extern, double);
-
34DLAF_CUBLAS_ADD_ETI(extern, std::complex<float>);
-
35DLAF_CUBLAS_ADD_ETI(extern, std::complex<double>);
-
36}
-
37
-
38#endif
+
23namespace dlaf::gpulapack {
+
24
+
25template <class T>
+
26void add(const blas::Uplo uplo, const SizeType m, const SizeType n, const T& alpha, const T* a,
+
27 const SizeType lda, T* b, const SizeType ldb, const whip::stream_t stream);
+
28
+
29#define DLAF_CUBLAS_ADD_ETI(kword, Type) \
+
30 kword template void add(const blas::Uplo uplo, const SizeType m, const SizeType n, const Type& alpha, \
+
31 const Type* a, const SizeType lda, Type* b, const SizeType ldb, \
+
32 const whip::stream_t stream)
+
33
+
34DLAF_CUBLAS_ADD_ETI(extern, float);
+
35DLAF_CUBLAS_ADD_ETI(extern, double);
+
36DLAF_CUBLAS_ADD_ETI(extern, std::complex<float>);
+
37DLAF_CUBLAS_ADD_ETI(extern, std::complex<double>);
+
38}
+
39
+
40#endif
dlaf::tile::add
void add(T alpha, const matrix::Tile< const T, D > &tile_b, const matrix::Tile< T, D > &tile_a)
types.h
diff --git a/master/auxiliary_2norm_2api_8h_source.html b/master/auxiliary_2norm_2api_8h_source.html index a17aac42cc..fe05c235f4 100644 --- a/master/auxiliary_2norm_2api_8h_source.html +++ b/master/auxiliary_2norm_2api_8h_source.html @@ -92,41 +92,43 @@
9//
10#pragma once
11
-
12#include <pika/execution.hpp>
+
12#include <complex>
13
-
14#include <dlaf/communication/communicator_grid.h>
-
15#include <dlaf/matrix/matrix.h>
-
16#include <dlaf/types.h>
-
17
-
18namespace dlaf::auxiliary::internal {
+
14#include <pika/execution.hpp>
+
15
+
16#include <dlaf/communication/communicator_grid.h>
+
17#include <dlaf/matrix/matrix.h>
+
18#include <dlaf/types.h>
19
-
20template <Backend backend, Device device, class T>
-
21struct Norm {};
-
22
-
23template <class T>
-
-
24struct Norm<Backend::MC, Device::CPU, T> {
-
25 static pika::execution::experimental::unique_any_sender<dlaf::BaseType<T>> max_L(
-
26 comm::CommunicatorGrid& comm_grid, comm::Index2D rank, Matrix<const T, Device::CPU>& matrix);
-
27
-
28 static pika::execution::experimental::unique_any_sender<dlaf::BaseType<T>> max_G(
-
29 comm::CommunicatorGrid& comm_grid, comm::Index2D rank, Matrix<const T, Device::CPU>& matrix);
-
30};
+
20namespace dlaf::auxiliary::internal {
+
21
+
22template <Backend backend, Device device, class T>
+
23struct Norm {};
+
24
+
25template <class T>
+
+
26struct Norm<Backend::MC, Device::CPU, T> {
+
27 static pika::execution::experimental::unique_any_sender<dlaf::BaseType<T>> max_L(
+
28 comm::CommunicatorGrid& comm_grid, comm::Index2D rank, Matrix<const T, Device::CPU>& matrix);
+
29
+
30 static pika::execution::experimental::unique_any_sender<dlaf::BaseType<T>> max_G(
+
31 comm::CommunicatorGrid& comm_grid, comm::Index2D rank, Matrix<const T, Device::CPU>& matrix);
+
32};
-
31
-
32// ETI
-
33#define DLAF_NORM_ETI(KWORD, DATATYPE) KWORD template struct Norm<Backend::MC, Device::CPU, DATATYPE>;
-
34
-
35DLAF_NORM_ETI(extern, float)
-
36DLAF_NORM_ETI(extern, double)
-
37DLAF_NORM_ETI(extern, std::complex<float>)
-
38DLAF_NORM_ETI(extern, std::complex<double>)
-
39}
+
33
+
34// ETI
+
35#define DLAF_NORM_ETI(KWORD, DATATYPE) KWORD template struct Norm<Backend::MC, Device::CPU, DATATYPE>;
+
36
+
37DLAF_NORM_ETI(extern, float)
+
38DLAF_NORM_ETI(extern, double)
+
39DLAF_NORM_ETI(extern, std::complex<float>)
+
40DLAF_NORM_ETI(extern, std::complex<double>)
+
41}
Definition communicator_grid.h:37
-
Definition api.h:21
+
Definition api.h:23
diff --git a/master/auxiliary_2norm_2mc_8h_source.html b/master/auxiliary_2norm_2mc_8h_source.html index 1176b6a80c..8dea521cc3 100644 --- a/master/auxiliary_2norm_2mc_8h_source.html +++ b/master/auxiliary_2norm_2mc_8h_source.html @@ -249,7 +249,7 @@
dlaf::comm::Communicator::rank
IndexT_MPI rank() const noexcept
Return the rank of the current process in the Communicator.
dlaf::common::Index2D< IndexT_MPI, TAG_MPI >
dlaf::internal::Policy
Definition policy.h:24
-
dlaf::matrix::Matrix
Definition matrix.h:61
+
dlaf::matrix::Matrix
Definition matrix.h:62
dlaf::common::make_data
auto make_data(Data &&data) noexcept
Definition data.h:78
distribution.h
reduce.h
@@ -263,8 +263,8 @@
reduce.h
types.h
util_matrix.h
-
dlaf::matrix::square_blocksize
bool square_blocksize(const MatrixLike &m) noexcept
Returns true if the matrix block size is square.
Definition util_matrix.h:48
-
dlaf::matrix::square_size
bool square_size(const MatrixLike &m) noexcept
Returns true if the matrix is square.
Definition util_matrix.h:42
+
dlaf::matrix::square_blocksize
bool square_blocksize(const MatrixLike &m) noexcept
Returns true if the matrix block size is square.
Definition util_matrix.h:49
+
dlaf::matrix::square_size
bool square_size(const MatrixLike &m) noexcept
Returns true if the matrix is square.
Definition util_matrix.h:43
vector.h
diff --git a/master/band__to__tridiag_8h_source.html b/master/band__to__tridiag_8h_source.html index 79f2b0ff62..989a08f097 100644 --- a/master/band__to__tridiag_8h_source.html +++ b/master/band__to__tridiag_8h_source.html @@ -166,8 +166,8 @@
dlaf::common::Size2D< IndexT_MPI, TAG_MPI >
communicator_grid.h
matrix.h
-
dlaf::eigensolver::internal::BandToTridiag
Definition api.h:37
-
dlaf::eigensolver::internal::TridiagResult
Definition api.h:19
+
dlaf::eigensolver::internal::BandToTridiag
Definition api.h:39
+
dlaf::eigensolver::internal::TridiagResult
Definition api.h:21
types.h
util_matrix.h
diff --git a/master/blas_2tile_8h_source.html b/master/blas_2tile_8h_source.html index 24944242af..c47abaf45e 100644 --- a/master/blas_2tile_8h_source.html +++ b/master/blas_2tile_8h_source.html @@ -413,7 +413,7 @@
DLAF_MAKE_CALLABLE_OBJECT
#define DLAF_MAKE_CALLABLE_OBJECT(fname)
Definition callable_object.h:29
dlaf::common::internal::SingleThreadedBlasScope
Definition single_threaded_blas.h:20
dlaf::internal::Policy
Definition policy.h:24
-
dlaf::matrix::Tile
Definition tile.h:332
+
dlaf::matrix::Tile
Definition tile.h:333
copy_tile.h
gpublas.h
tile.h
diff --git a/master/broadcast__panel_8h_source.html b/master/broadcast__panel_8h_source.html index 579337e6a2..67600e7b0f 100644 --- a/master/broadcast__panel_8h_source.html +++ b/master/broadcast__panel_8h_source.html @@ -261,8 +261,8 @@
dlaf::comm::broadcast
void broadcast(comm::IndexT_MPI rank_root, matrix::Panel< axis, T, D, storage > &panel, comm::CommunicatorPipeline< coord_to_communicator_type(orthogonal(axis))> &serial_comm)
Definition broadcast_panel.h:61
dlaf::comm::CommunicatorPipeline
Definition communicator_pipeline.h:41
dlaf::common::Index2D< SizeType, matrix::LocalTile_TAG >
-
dlaf::matrix::Matrix
Definition matrix.h:61
-
dlaf::matrix::Matrix::readwrite
ReadWriteSenderType readwrite(const LocalTileIndex &index) noexcept
Definition matrix.h:153
+
dlaf::matrix::Matrix
Definition matrix.h:62
+
dlaf::matrix::Matrix::readwrite
ReadWriteSenderType readwrite(const LocalTileIndex &index) noexcept
Definition matrix.h:154
index.h
dlaf::comm::IndexT_MPI
int IndexT_MPI
Type used for indexes in MPI API.
Definition index.h:20
communicator_pipeline.h
diff --git a/master/bt__band__to__tridiag_8h_source.html b/master/bt__band__to__tridiag_8h_source.html index a31375af1a..b4e3349813 100644 --- a/master/bt__band__to__tridiag_8h_source.html +++ b/master/bt__band__to__tridiag_8h_source.html @@ -147,11 +147,11 @@
133}
dlaf::eigensolver::internal::bt_band_to_tridiagonal
void bt_band_to_tridiagonal(const SizeType band_size, MatrixRef< T, D > &mat_e, matrix::Matrix< const T, Device::CPU > &mat_hh)
Definition bt_band_to_tridiag.h:60
dlaf::comm::CommunicatorGrid
Definition communicator_grid.h:37
-
dlaf::matrix::Matrix
Definition matrix.h:61
-
dlaf::matrix::internal::MatrixRef
Definition matrix_ref.h:171
+
dlaf::matrix::Matrix
Definition matrix.h:62
+
dlaf::matrix::internal::MatrixRef
Definition matrix_ref.h:172
matrix.h
matrix_ref.h
-
dlaf::eigensolver::internal::BackTransformationT2B
Definition api.h:23
+
dlaf::eigensolver::internal::BackTransformationT2B
Definition api.h:25
types.h
util_matrix.h
diff --git a/master/bt__reduction__to__band_8h_source.html b/master/bt__reduction__to__band_8h_source.html index 21473bb54d..59a23e30cc 100644 --- a/master/bt__reduction__to__band_8h_source.html +++ b/master/bt__reduction__to__band_8h_source.html @@ -156,11 +156,11 @@
108}
dlaf::eigensolver::internal::bt_reduction_to_band
void bt_reduction_to_band(const SizeType b, MatrixRef< T, device > &mat_c, Matrix< const T, device > &mat_v, Matrix< const T, Device::CPU > &mat_taus)
Definition bt_reduction_to_band.h:45
dlaf::comm::CommunicatorGrid
Definition communicator_grid.h:37
-
dlaf::matrix::internal::MatrixRef
Definition matrix_ref.h:171
+
dlaf::matrix::internal::MatrixRef
Definition matrix_ref.h:172
communicator_grid.h
matrix.h
matrix_ref.h
-
dlaf::eigensolver::internal::BackTransformationReductionToBand
Definition api.h:21
+
dlaf::eigensolver::internal::BackTransformationReductionToBand
Definition api.h:23
types.h
util_matrix.h
diff --git a/master/copy_8h_source.html b/master/copy_8h_source.html index 4991d71879..28ac979d55 100644 --- a/master/copy_8h_source.html +++ b/master/copy_8h_source.html @@ -283,9 +283,9 @@
dlaf::common::Index2D< SizeType, matrix::LocalTile_TAG >
dlaf::common::Size2D< SizeType, matrix::LocalTile_TAG >
dlaf::internal::Policy
Definition policy.h:24
-
dlaf::matrix::Matrix
Definition matrix.h:61
-
dlaf::matrix::Matrix::retiledSubPipeline
Matrix retiledSubPipeline(const LocalTileSize &tiles_per_block) noexcept
Definition matrix.h:184
-
dlaf::matrix::Matrix::readwrite
ReadWriteSenderType readwrite(const LocalTileIndex &index) noexcept
Definition matrix.h:153
+
dlaf::matrix::Matrix
Definition matrix.h:62
+
dlaf::matrix::Matrix::retiledSubPipeline
Matrix retiledSubPipeline(const LocalTileSize &tiles_per_block) noexcept
Definition matrix.h:185
+
dlaf::matrix::Matrix::readwrite
ReadWriteSenderType readwrite(const LocalTileIndex &index) noexcept
Definition matrix.h:154
dlaf::comm::IndexT_MPI
int IndexT_MPI
Type used for indexes in MPI API.
Definition index.h:20
communicator.h
copy_tile.h
@@ -301,10 +301,10 @@
dlaf::to_int
auto to_int(const T unsigned_value)
Definition types.h:248
util_math.h
util_matrix.h
-
dlaf::matrix::equal_process_grid
bool equal_process_grid(const MatrixLike< const T, D > &m, const comm::CommunicatorGrid &g) noexcept
Returns true if the matrix is distributed on the communication grid.
Definition util_matrix.h:78
-
dlaf::matrix::single_tile_per_block
bool single_tile_per_block(const MatrixLike &m) noexcept
Returns true if the matrix has a single tile per block.
Definition util_matrix.h:54
-
dlaf::matrix::local_matrix
bool local_matrix(const MatrixLike< const T, D > &m) noexcept
Returns true if the matrix is local to a process.
Definition util_matrix.h:72
-
dlaf::matrix::equal_size
bool equal_size(const MatrixLikeA &lhs, const MatrixLikeB &rhs) noexcept
Returns true if matrices have equal sizes.
Definition util_matrix.h:60
+
dlaf::matrix::equal_process_grid
bool equal_process_grid(const MatrixLike< const T, D > &m, const comm::CommunicatorGrid &g) noexcept
Returns true if the matrix is distributed on the communication grid.
Definition util_matrix.h:79
+
dlaf::matrix::single_tile_per_block
bool single_tile_per_block(const MatrixLike &m) noexcept
Returns true if the matrix has a single tile per block.
Definition util_matrix.h:55
+
dlaf::matrix::local_matrix
bool local_matrix(const MatrixLike< const T, D > &m) noexcept
Returns true if the matrix is local to a process.
Definition util_matrix.h:73
+
dlaf::matrix::equal_size
bool equal_size(const MatrixLikeA &lhs, const MatrixLikeB &rhs) noexcept
Returns true if matrices have equal sizes.
Definition util_matrix.h:61