Namespace for auxiliary functions/classes. More...

Namespaces
namespace	acoustic

namespace	acoustic_analogy

namespace	alloc

namespace	collector_memory
	Helper functions useful for allocating collector memory.

namespace	container

namespace	coupling

namespace	debug

namespace	detail_

namespace	dg

namespace	dlb

namespace	dlbTimer

namespace	fc

namespace	filter

namespace	fv

namespace	geom

namespace	grid

namespace	io

namespace	lb

namespace	lblpt

namespace	logtable

namespace	lpt

namespace	ls

namespace	math

namespace	mpi

namespace	parallel_io

namespace	post

namespace	rb

namespace	sbp

namespace	structured

namespace	tensor
	Namespace that contains all classes, functions and constants needed for Tensor.

Classes
class	CartesianSolver

struct	is_unsigned

struct	is_unsigned< MUint >

struct	is_unsigned< MUlong >

struct	maia_signed

struct	maia_unsigned

struct	PatchRefinement

struct	RangeIterator
	Dummy iterator class. More...

struct	type_traits

struct	type_traits< long >

struct	type_traits< MBool >

struct	type_traits< MChar >

struct	type_traits< MFloat >

struct	type_traits< MInt >

struct	type_traits< MLong >

struct	type_traits< MString >

struct	type_traits< MUint >

struct	type_traits< MUlong >

struct	type_traits< uint_fast8_t >

Functions
template<class UnaryFunction >
void	parallelFor_base (MInt begin, MInt end, UnaryFunction &&f)
	Wrapper function for parallel for loop (no PSTL) More...

template<class UnaryFunction >
void	parallelFor_pstl (MInt begin, MInt end, UnaryFunction &&f)
	Wrapper function for parallel for loop (PSTL) More...

template<MBool portedToGpu = false, class UnaryFunction >
void	parallelFor (MInt begin, MInt end, UnaryFunction &&f)
	Wrapper function for parallel for loop. More...

template<class UnaryFunction , class T >
void	parallelFor_base (const std::vector< T > &container, UnaryFunction &&f)
	Wrapper function for parallel for loop (STL container based, no PSTL) More...

template<class UnaryFunction , class T >
void	parallelFor_pstl (const std::vector< T > &container, UnaryFunction &&f)
	Wrapper function for parallel for loop (STL container based, PSTL) More...

template<MBool portedToGpu = false, class UnaryFunction , class T >
void	parallelFor (const std::vector< T > &container, UnaryFunction &&f)
	Wrapper function for parallel for loop (STL container based) More...

template<MInt nDim, class UnaryFunction >
void	parallelFor_base (std::array< MInt, nDim > begin, std::array< MInt, nDim > end, UnaryFunction &&f)
	Wrapper function for parallel nested for loops [NON-PSTL]. More...

template<MInt nDim, class UnaryFunction >
void	parallelFor_pstl (std::array< MInt, nDim > begin, std::array< MInt, nDim > end, UnaryFunction &&f)
	Wrapper function for parallel nested for loops [PSTL]. More...

template<MBool portedToGpu = false, MInt nDim, class UnaryFunction >
void	parallelFor (std::array< MInt, nDim > begin, std::array< MInt, nDim > end, UnaryFunction &&f)
	Wrapper function for parallel nested for loops. More...

Detailed Description

Classes with constant number of space dimensions nd.

Helper class for automatic tracing.

type traits for dealing with signed vs unsigned indices

Note: we should not do this...

Todo: labels:toenhance use <type_traits> instead of this hack

Function Documentation

◆ parallelFor() [1/3]

template<MBool portedToGpu = false, class UnaryFunction , class T >

void maia::parallelFor	(	const std::vector< T > &	container,
		UnaryFunction &&	f
	)

inline

Author: Miro Gondrum

Date: 18.02.2022

Parameters

[in]	container	STL container whose entries are looped over
[in]	f	function which represents the loop body

This function wraps a for loop such that it is executed in parallel, depending on the given compiler flags. The loop has to be of the following type: for( auto& item: container) { f(item); }

Definition at line 197 of file parallelfor.h.

                                                                          {
  // Compile-time dispatch on the portedToGpu template flag: the plain
  // (non-PSTL) wrapper is used unless the loop is marked as ported to GPU.
  if constexpr(!portedToGpu) {
    parallelFor_base(container, f);
  } else {
    parallelFor_pstl(container, f);
  }
}

◆ parallelFor() [2/3]

template<MBool portedToGpu = false, class UnaryFunction >

void maia::parallelFor	(	MInt	begin,
		MInt	end,
		UnaryFunction &&	f
	)

inline

Author: Miro Gondrum

Date: 02.12.2021

Parameters

[in]	begin	start value of iteration
[in]	end	end value of iteration
[in]	f	function which represents the loop body

This function wraps a for loop such that it is executed in parallel, depending on the given compiler flags. The loop has to be of the following type: for( int i = begin; i < end ; i++) { f(i); }

Definition at line 147 of file parallelfor.h.

                                                                 {
  // Compile-time dispatch on the portedToGpu template flag: the plain
  // (non-PSTL) wrapper is used unless the loop is marked as ported to GPU.
  if constexpr(!portedToGpu) {
    parallelFor_base(begin, end, f);
  } else {
    parallelFor_pstl(begin, end, f);
  }
}

◆ parallelFor() [3/3]

template<MBool portedToGpu = false, MInt nDim, class UnaryFunction >

void maia::parallelFor	(	std::array< MInt, nDim >	begin,
		std::array< MInt, nDim >	end,
		UnaryFunction &&	f
	)

inline

Author: Marian Albers, Miro Gondrum

Date: 07.03.2023

Parameters

[in]	begin[nDim]	start value of iteration
[in]	end[nDim]	end value of iteration
[in]	f	function which represents the loop body

This function wraps one or multiple nested for loops such that they are executed in parallel, depending on the given compiler flags. The loop has to be of the following type: for( int i = begin[0]; i < end[0] ; i++) { f(i); } or for( int i = begin[0]; i < end[0] ; i++) { for( int j = begin[1]; j < end[1] ; j++) { f(i,j); } }

Definition at line 306 of file parallelfor.h.

                                                                                                 {
  // Compile-time dispatch on the portedToGpu template flag: the plain
  // (non-PSTL) wrapper is used unless the loop is marked as ported to GPU.
  if constexpr(!portedToGpu) {
    parallelFor_base<nDim>(begin, end, f);
  } else {
    parallelFor_pstl<nDim>(begin, end, f);
  }
}

◆ parallelFor_base() [1/3]

template<class UnaryFunction , class T >

void maia::parallelFor_base	(	const std::vector< T > &	container,
		UnaryFunction &&	f
	)

inline

Author: Miro Gondrum

Date: 21.02.2022

Note: PLEASE USE parallelFor(..) function

Definition at line 161 of file parallelfor.h.

                                                                               {
  // Number of entries to visit, held as MInt so it can serve as the loop bound.
  const MInt count = container.size();
#if defined(_OPENMP)
#pragma omp parallel for schedule(static, CHUNK_SIZE) default(none) shared(count, f, container)
#endif
  for(MInt idx = 0; idx < count; ++idx) {
    // Apply the loop body to each entry of the container.
    f(container[idx]);
  }
}

◆ parallelFor_base() [2/3]

template<class UnaryFunction >

void maia::parallelFor_base	(	MInt	begin,
		MInt	end,
		UnaryFunction &&	f
	)

inline

Author: Miro Gondrum

Date: 21.02.2022

Note: PLEASE USE parallelFor(..) function

Definition at line 99 of file parallelfor.h.

                                                                      {
  // Index loop over [begin, end); parallelised with OpenMP when _OPENMP is
  // defined, otherwise executed as an ordinary serial loop.
#if defined(_OPENMP)
#pragma omp parallel for schedule(static, CHUNK_SIZE) default(none) shared(begin, end, f)
#endif
  for(MInt idx = begin; idx < end; ++idx) {
    f(idx);
  }
}

◆ parallelFor_base() [3/3]

template<MInt nDim, class UnaryFunction >

void maia::parallelFor_base	(	std::array< MInt, nDim >	begin,
		std::array< MInt, nDim >	end,
		UnaryFunction &&	f
	)

inline

Author: Marian Albers, Miro Gondrum

Date: 07.03.2023

Note: PLEASE USE parallelFor(..) function

Definition at line 212 of file parallelfor.h.

                                                                                                      {
  // Nested index loops over [begin[d], end[d]) per dimension d; index 0 is the
  // innermost (fastest running) loop. With OpenMP the nest is collapsed.
  if constexpr(nDim == 2) {
#if defined(_OPENMP)
#pragma omp parallel for schedule(static, CHUNK_SIZE) default(none) shared(begin, end, f) collapse(2)
#endif
    for(MInt iy = begin[1]; iy < end[1]; ++iy) {
      for(MInt ix = begin[0]; ix < end[0]; ++ix) {
        f(ix, iy);
      }
    }
  } else if constexpr(nDim == 3) {
#if defined(_OPENMP)
#pragma omp parallel for schedule(static, CHUNK_SIZE) default(none) shared(begin, end, f) collapse(3)
#endif
    for(MInt iz = begin[2]; iz < end[2]; ++iz) {
      for(MInt iy = begin[1]; iy < end[1]; ++iy) {
        for(MInt ix = begin[0]; ix < end[0]; ++ix) {
          f(ix, iy, iz);
        }
      }
    }
  } else {
    // Any other dimensionality is rejected at run time.
    mTerm(1, AT_, "Only nDim==2 and nDim==3 supported");
  }
}

◆ parallelFor_pstl() [1/3]

template<class UnaryFunction , class T >

void maia::parallelFor_pstl	(	const std::vector< T > &	container,
		UnaryFunction &&	f
	)

inline

Author: Miro Gondrum

Date: 21.02.2022

Note: PLEASE USE parallelFor(..) function

Definition at line 177 of file parallelfor.h.

                                                                               {
  // Applies f to every entry of container. With MAIA_PSTL the parallel STL is
  // used, otherwise the call is forwarded to the non-PSTL wrapper.
#if defined(MAIA_PSTL)
  // An iterator pair is available here, so std::for_each is the matching
  // algorithm; std::for_each_n expects (first, count, f) and must not be
  // given container.end() as its count argument.
  std::for_each(std::execution::par_unseq, container.begin(), container.end(), f);
#else
  parallelFor_base(container, f);
#endif
}

◆ parallelFor_pstl() [2/3]

template<class UnaryFunction >

void maia::parallelFor_pstl	(	MInt	begin,
		MInt	end,
		UnaryFunction &&	f
	)

inline

Author: Miro Gondrum

Date: 21.02.2022

Note: PLEASE USE parallelFor(..) function

Definition at line 114 of file parallelfor.h.

                                                                      {
  // Runs f(i) for i in [begin, end). With MAIA_PSTL the parallel STL is used,
  // otherwise the call is forwarded to the non-PSTL wrapper.
#if defined(MAIA_PSTL)
#if defined(MAIA_NVHPC_COMPILER)
  // WAR: https://nvbugs/3285841
  // TODO labels:gpu The RangeIterator is not working for nvhpc's pstl
  // implementation, yet.
  auto begin_ = thrust::counting_iterator(MInt{begin});
  // std::for_each_n expects the NUMBER of iterations as its third argument,
  // not the end value. Passing end - begin makes non-zero begin values work;
  // the count is clamped to zero so that an empty range (end <= begin) never
  // yields a negative count.
  auto end_ = (end > begin) ? (end - begin) : MInt{0};
#else
  auto begin_ = RangeIterator(begin);
  // NOTE(review): end_ is handed to std::for_each_n as its count argument;
  // whether this covers begin != 0 correctly depends on RangeIterator, which
  // is not visible here - TODO confirm.
  auto end_ = RangeIterator(end);
#endif
  // TODO miro: GCC: How to trigger the usage of more threads? Currently, in my
  // case, it is using only 1 thread. Hence, OpenMP is performing better
  std::for_each_n(std::execution::par_unseq, begin_, end_, f);
#else /* defined(MAIA_PSTL) */
  parallelFor_base(begin, end, f);
#endif
}

◆ parallelFor_pstl() [3/3]

template<MInt nDim, class UnaryFunction >

void maia::parallelFor_pstl	(	std::array< MInt, nDim >	begin,
		std::array< MInt, nDim >	end,
		UnaryFunction &&	f
	)

inline

Author: Marian Albers, Miro Gondrum

Date: 07.03.2023

Note: PLEASE USE parallelFor(..) function

Definition at line 244 of file parallelfor.h.

                                                                                                      {
  // Runs f over the nDim-dimensional index box [begin[d], end[d]). With
  // MAIA_PSTL the box is flattened to one index range [0, endI) that is
  // traversed with the parallel STL; otherwise the call is forwarded to the
  // non-PSTL wrapper.
#if defined(MAIA_PSTL)
  std::array<MInt, nDim> size{};
  const MInt beginI = 0;
  MInt endI = 1;
  // Extent per dimension and total number of flattened iterations.
  for(MInt dim = 0; dim < nDim; ++dim) {
    size[dim] = end[dim] - begin[dim];
    endI *= size[dim];
  }
#if defined(MAIA_NVHPC_COMPILER)
  // WAR: https://nvbugs/3285841
  // TODO labels:gpu So far this only works with begin == 0. The
  // RangeIterator is not working for nvhpc's pstl implementation, yet.
  auto begin_ = thrust::counting_iterator(MInt{beginI});
  auto end_ = endI;
#else
  auto begin_ = RangeIterator(beginI);
  auto end_ = RangeIterator(endI);
#endif

  if constexpr(nDim == 3) {
    std::for_each_n(std::execution::par_unseq, begin_, end_, [=](auto& I) {
      // Decompose the flat index with zero-based local indices first and add
      // the begin offsets afterwards. Using the already shifted k to derive j
      // would give wrong results whenever begin[2] != 0.
      const MInt planeSize = size[0] * size[1];
      const MInt kLocal = I / planeSize;
      const MInt inPlane = I - kLocal * planeSize;
      const MInt k = kLocal + begin[2];
      const MInt j = (inPlane / size[0]) + begin[1];
      const MInt i = (inPlane % size[0]) + begin[0];

      f(i, j, k);
    });
  } else if constexpr(nDim == 2) {
    std::for_each_n(std::execution::par_unseq, begin_, end_, [=](auto& I) {
      const MInt j = (I / size[0]) + begin[1];
      const MInt i = (I % size[0]) + begin[0];

      f(i, j);
    });
  }
  // NOTE(review): for any other nDim nothing is executed in this code path.
#else /* defined(MAIA_PSTL) */
  parallelFor_base<nDim>(begin, end, f);
#endif
}

Namespaces

Classes

Functions

Detailed Description

Function Documentation

◆ parallelFor() [1/3]

◆ parallelFor() [2/3]

◆ parallelFor() [3/3]

◆ parallelFor_base() [1/3]

◆ parallelFor_base() [2/3]

◆ parallelFor_base() [3/3]

◆ parallelFor_pstl() [1/3]

◆ parallelFor_pstl() [2/3]

◆ parallelFor_pstl() [3/3]