d1/d7e/operator_8hh_source.html

/*  This file is part of the OpenLB library

 *

 *  Copyright (C) 2022 Adrian Kummerlaender

 *  E-mail contact: info@openlb.net

 *  The most recent release of OpenLB can be downloaded at

 *  <http://www.openlb.net/>

 *

 *  This program is free software; you can redistribute it and/or

 *  modify it under the terms of the GNU General Public License

 *  as published by the Free Software Foundation; either version 2

 *  of the License, or (at your option) any later version.

 *

 *  This program is distributed in the hope that it will be useful,

 *  but WITHOUT ANY WARRANTY; without even the implied warranty of

 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 *  GNU General Public License for more details.

 *

 *  You should have received a copy of the GNU General Public

 *  License along with this program; if not, write to the Free

 *  Software Foundation, Inc., 51 Franklin Street, Fifth Floor,

 *  Boston, MA  02110-1301, USA.

*/


#ifndef GPU_CUDA_OPERATOR_HH

#define GPU_CUDA_OPERATOR_HH


#include "operator.h"


#include "context.hh"

#include "dynamics.hh"


namespace olb {


struct CollisionSubdomainMask;


namespace gpu {


namespace cuda {


/// Masked application of DYNAMICS::apply for use in kernel::call_operators
/**
 * Stores a by-value copy of the DYNAMICS parameters and a raw pointer to a
 * per-cell boolean mask. Both call operators report whether the cell was
 * handled, which lets several instances be chained by a short-circuiting
 * fold in the kernels.
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS>
class MaskedCollision {
private:
  /// Parameters forwarded to DYNAMICS::apply (copied at construction)
  ParametersOfOperatorD<T,DESCRIPTOR,DYNAMICS> _parameters;
  /// Per-cell mask indexed by CellID (callers in this file pass deviceData() pointers)
  bool* _mask;

  /// Collide the cell at iCell using DYNAMICS and hand back its statistic
  CellStatistic<T> apply(DeviceContext<T,DESCRIPTOR>& lattice, CellID iCell) __device__ {
    DataOnlyCell<T,DESCRIPTOR> target(lattice, iCell);
    return DYNAMICS().apply(target, _parameters);
  }

public:
  /// Constructor (commonly called on the host side)
  MaskedCollision(ParametersOfOperatorD<T,DESCRIPTOR,DYNAMICS>& parameters, bool* mask) any_platform:
    _parameters{parameters},
    _mask{mask}
  { }

  /// Chainable call operator for use in kernel::call_operators
  /**
   * \return true iff the mask selects iCell (in which case DYNAMICS was applied)
   **/
  bool operator()(DeviceContext<T,DESCRIPTOR>& lattice, CellID iCell) __device__ {
    if (!_mask[iCell]) {
      return false;
    }
    apply(lattice, iCell);
    return true;
  }

  /// Chainable call operator with statistics storage
  /**
   * Same as the two-argument overload but additionally stores the result of
   * the collision in statistic. statistic is left untouched for unselected cells.
   **/
  bool operator()(DeviceContext<T,DESCRIPTOR>& lattice, CellID iCell, CellStatistic<T>& statistic) __device__ {
    if (!_mask[iCell]) {
      return false;
    }
    statistic = apply(lattice, iCell);
    return true;
  }

};


/// List-based application of DYNAMICS::apply for use in kernel::call_list_operators
/**
 * Unlike MaskedCollision there is no mask lookup: every cell index handed to
 * the call operators is collided and both overloads always return true.
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS>
class ListedCollision {
private:
  /// Parameters forwarded to DYNAMICS::apply (copied at construction)
  ParametersOfOperatorD<T,DESCRIPTOR,DYNAMICS> _parameters;

public:
  /// Copies parameters; declared host-only
  ListedCollision(ParametersOfOperatorD<T,DESCRIPTOR,DYNAMICS>& parameters) __host__:
    _parameters{parameters}
  { }

  /// Collide cell iCell, discarding the resulting statistic
  bool operator()(DeviceContext<T,DESCRIPTOR>& lattice, CellID iCell) __device__ {
    DataOnlyCell<T,DESCRIPTOR> target(lattice, iCell);
    DYNAMICS().apply(target, _parameters);
    return true;
  }

  /// Collide cell iCell and store the resulting statistic in statistic
  bool operator()(DeviceContext<T,DESCRIPTOR>& lattice, CellID iCell, CellStatistic<T>& statistic) __device__ {
    DataOnlyCell<T,DESCRIPTOR> target(lattice, iCell);
    statistic = DYNAMICS().apply(target, _parameters);
    return true;
  }

};


/// Masked application of OPERATOR::apply
/**
 * Applies a default-constructed OPERATOR to the cells selected by a per-cell
 * boolean mask.
 **/
template <typename OPERATOR>
class MaskedPostProcessor {
private:
  /// Per-cell mask indexed by CellID
  bool* _mask;

public:
  /// Stores the mask pointer; the pointed-to data is not copied
  MaskedPostProcessor(bool* mask) any_platform:
    _mask{mask}
  { }

  /// Apply OPERATOR to cell iCell if the mask selects it
  /**
   * \return true iff the mask selects iCell (in which case OPERATOR was applied)
   **/
  template <typename T, typename DESCRIPTOR>
  bool operator()(DeviceBlockLattice<T,DESCRIPTOR>& lattice, CellID iCell) __device__ {
    if (!_mask[iCell]) {
      return false;
    }
    Cell<T,DESCRIPTOR> target(lattice, iCell);
    OPERATOR().apply(target);
    return true;
  }

};


/// List-based application of OPERATOR::apply
/**
 * Stateless functor: a default-constructed OPERATOR is applied to every cell
 * index it is called with.
 **/
template <typename OPERATOR>
struct ListedPostProcessor {
  /// Apply OPERATOR to cell iCell of lattice; always returns true
  template <typename T, typename DESCRIPTOR>
  bool operator()(DeviceBlockLattice<T,DESCRIPTOR>& lattice, CellID iCell) __device__ {
    Cell<T,DESCRIPTOR> target(lattice, iCell);
    OPERATOR().apply(target);
    return true;
  }

};


/// List-based application of OPERATOR::apply with parameters
/**
 * Same idea as ListedPostProcessor, except that a by-value copy of the
 * operator parameters is passed along to OPERATOR::apply.
 **/
template <typename T, typename DESCRIPTOR, typename OPERATOR>
class ListedPostProcessorWithParameters {
private:
  /// Parameters forwarded to OPERATOR::apply (copied at construction)
  ParametersOfOperatorD<T,DESCRIPTOR,OPERATOR> _parameters;

public:
  /// Copies parameters; declared host-only
  ListedPostProcessorWithParameters(ParametersOfOperatorD<T,DESCRIPTOR,OPERATOR>& parameters) __host__:
    _parameters{parameters}
  { }

  /// Apply OPERATOR with the stored parameters to cell iCell; always returns true
  bool operator()(DeviceBlockLattice<T,DESCRIPTOR>& lattice, CellID iCell) __device__ {
    Cell<T,DESCRIPTOR> target(lattice, iCell);
    OPERATOR().apply(target, _parameters);
    return true;
  }

};


/// Unrestricted application of COUPLING::apply
/**
 * Stateless functor used with kernel::call_coupling_operators. No mask is
 * consulted here; any restriction to a subdomain is done by the kernel.
 **/
template <typename COUPLER>
struct UnmaskedCoupling {
  /// Build one Cell per coupled lattice at index iCell and apply COUPLER to them
  /**
   * \return always true
   **/
  template <typename CONTEXT>
  bool operator()(CONTEXT& lattices,
                  CellID iCell) __device__ {
    // Replace each entry of lattices by a Cell view of that entry at iCell
    auto cells = lattices.exchange_values([&](auto key) {
      return Cell{lattices.get(key), iCell};
    });
    COUPLER().apply(cells);
    return true;
  }

};


/// Unrestricted application of COUPLING::apply with parameters
/**
 * Like UnmaskedCoupling but carries a by-value copy of the coupler's
 * parameters, which is passed to COUPLER::apply together with the cells.
 **/
template <typename COUPLER, typename COUPLEES>
class UnmaskedCouplingWithParameters {
private:
  /// Concrete parameter storage type derived from the fields COUPLER declares
  using stored_parameters_t = typename COUPLER::parameters::template decompose_into<
    AbstractCouplingO<COUPLEES>::ParametersD::template include_fields
  >;

  /// Parameters forwarded to COUPLER::apply
  stored_parameters_t _parameters;

public:
  /// Initializes the stored parameters from parameters
  template <typename PARAMETERS>
  UnmaskedCouplingWithParameters(PARAMETERS& parameters) any_platform:
    _parameters{parameters}
  { }

  /// Build one Cell per coupled lattice at index iCell and apply COUPLER with parameters
  /**
   * \return always true
   **/
  template <typename CONTEXT>
  bool operator()(CONTEXT& lattices,
                  CellID iCell) __device__ {
    // Replace each entry of lattices by a Cell view of that entry at iCell
    auto cells = lattices.exchange_values([&](auto key) {
      return Cell{lattices.get(key), iCell};
    });
    COUPLER().apply(cells, _parameters);
    return true;
  }

};


/// Helper for constructing fused collision operators
/**
 * Returns a callable that collides a GPU block using one MaskedCollision per
 * entry of DYNAMICS, followed by DynamicDispatchCollision as the last
 * operator of the chain. Depending on block.statisticsEnabled() the
 * statistics-tracking or the plain launch helper is used.
 **/
template <typename T, typename DESCRIPTOR, typename... DYNAMICS>
std::function<void(ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>&)>
getFusedCollisionO() {
  return [](ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>& block) {
    bool* collisionSubdomain = block.template getData<CollisionSubdomainMask>().deviceData();
    DeviceContext<T,DESCRIPTOR> context(block);
    if (!block.statisticsEnabled()) {
      call_operators(
        context,
        collisionSubdomain,
        // One masked operator per DYNAMICS, each with its own parameters and mask
        MaskedCollision<T,DESCRIPTOR,DYNAMICS>{
          block.template getData<OperatorParameters<DYNAMICS>>().parameters,
          block.template getData<DynamicsMask<DYNAMICS>>().deviceData()
        }...,
        DynamicDispatchCollision{});
    } else {
      call_operators_with_statistics(
        context,
        collisionSubdomain,
        // One masked operator per DYNAMICS, each with its own parameters and mask
        MaskedCollision<T,DESCRIPTOR,DYNAMICS>{
          block.template getData<OperatorParameters<DYNAMICS>>().parameters,
          block.template getData<DynamicsMask<DYNAMICS>>().deviceData()
        }...,
        DynamicDispatchCollision{});
    }
  };
}


namespace kernel {


/// CUDA kernel for applying purely local collision steps
/**
 * One thread per cell, using a 1D launch: the cell index is derived from
 * blockIdx.x, blockDim.x and threadIdx.x. Threads beyond the lattice size or
 * outside of subdomain do nothing. The operators are tried in order and the
 * fold stops at the first one that returns true.
 **/
template <typename CONTEXT, typename... OPERATORS>
void call_operators(CONTEXT lattice, bool* subdomain, OPERATORS... ops) __global__ {
  const CellID iCell = blockIdx.x * blockDim.x + threadIdx.x;
  // The bounds test comes first so that subdomain is never read out of range
  if ((iCell < lattice.getNcells()) && subdomain[iCell]) {
    (ops(lattice, iCell) || ... );
  }
}


/// CUDA kernel for applying purely local collision steps while tracking statistics
/**
 * One thread per cell (1D launch). Threads beyond the lattice size or outside
 * of subdomain do nothing. If one of the operators handles the cell, its
 * statistic is written to the STATISTIC / STATISTIC_GENERATED fields at the
 * cell index; cells handled by no operator leave these fields untouched.
 **/
template <typename CONTEXT, typename... OPERATORS>
void call_operators_with_statistics(CONTEXT lattice, bool* subdomain, OPERATORS... ops) __global__ {
  using value_t = typename CONTEXT::value_t;

  const CellID iCell = blockIdx.x * blockDim.x + threadIdx.x;
  // The bounds test comes first so that subdomain is never read out of range
  const bool active = (iCell < lattice.getNcells()) && subdomain[iCell];
  if (!active) {
    return;
  }

  value_t** statistic = lattice.template getField<descriptors::STATISTIC>();
  int* statisticGenerated = lattice.template getField<descriptors::STATISTIC_GENERATED>()[0];

  // Initialized to {-1, -1} until an operator overwrites it
  CellStatistic<value_t> result{-1, -1};
  const bool handled = (ops(lattice, iCell, result) || ... );
  if (!handled) {
    return;
  }

  if (result) {
    statisticGenerated[iCell] = 1;
    statistic[0][iCell] = result.rho;
    statistic[1][iCell] = result.uSqr;
  } else {
    // No usable statistic for this cell: flag it and zero its entries
    statisticGenerated[iCell] = 0;
    statistic[0][iCell] = 0;
    statistic[1][iCell] = 0;
  }
}


/// CUDA kernel for applying generic OPERATORS with OperatorScope::PerCell or ListedCollision
/**
 * One thread per list entry (1D launch). Threads whose flat index is not
 * below nIndices do nothing. The operators are tried in order on the cell
 * index stored at the thread's list position; the fold stops at the first
 * operator returning true.
 *
 * \param lattice  Device-side view passed to every operator
 * \param indices  Array of at least nIndices cell indices
 * \param nIndices Number of valid entries in indices
 * \param ops      Operators callable as ops(lattice, iCell) -> bool
 **/
template <typename CONTEXT, typename... OPERATORS>
void call_list_operators(CONTEXT lattice,
                         const CellID* indices, std::size_t nIndices,
                         OPERATORS... ops) __global__ {
  // Widen before multiplying: blockIdx.x * blockDim.x would otherwise be
  // evaluated in 32-bit unsigned arithmetic and wrap before the conversion.
  const std::size_t iIndex = static_cast<std::size_t>(blockIdx.x) * blockDim.x + threadIdx.x;
  if (!(iIndex < nIndices)) {
    return;
  }
  const CellID iCell = indices[iIndex];
  (ops(lattice, iCell) || ... );
}


/// CUDA kernel for applying ListedCollision
/**
 * One thread per list entry (1D launch). Threads whose flat index is not
 * below nIndices do nothing. If one of the operators handles the listed
 * cell, its statistic is written to the STATISTIC / STATISTIC_GENERATED
 * fields at that cell's index; otherwise these fields are left untouched.
 *
 * \param lattice  Device-side view passed to every operator
 * \param indices  Array of at least nIndices cell indices
 * \param nIndices Number of valid entries in indices
 * \param ops      Operators callable as ops(lattice, iCell, statistic) -> bool
 **/
template <typename CONTEXT, typename... OPERATORS>
void call_list_operators_with_statistics(CONTEXT lattice,
                                         const CellID* indices, std::size_t nIndices,
                                         OPERATORS... ops) __global__ {
  // Widen before multiplying: blockIdx.x * blockDim.x would otherwise be
  // evaluated in 32-bit unsigned arithmetic and wrap before the conversion.
  const std::size_t iIndex = static_cast<std::size_t>(blockIdx.x) * blockDim.x + threadIdx.x;
  if (!(iIndex < nIndices)) {
    return;
  }
  // Read the cell index once instead of reloading it for every access below
  const CellID iCell = indices[iIndex];

  typename CONTEXT::value_t** statistic = lattice.template getField<descriptors::STATISTIC>();
  int* statisticGenerated = lattice.template getField<descriptors::STATISTIC_GENERATED>()[0];

  // Initialized to {-1, -1} until an operator overwrites it
  CellStatistic<typename CONTEXT::value_t> cellStatistic{-1, -1};
  if ((ops(lattice, iCell, cellStatistic) || ... )) {
    if (cellStatistic) {
      statisticGenerated[iCell] = 1;
      statistic[0][iCell] = cellStatistic.rho;
      statistic[1][iCell] = cellStatistic.uSqr;
    } else {
      // No usable statistic for this cell: flag it and zero its entries
      statisticGenerated[iCell] = 0;
      statistic[0][iCell] = 0;
      statistic[1][iCell] = 0;
    }
  }
}


/// CUDA kernel for applying UnmaskedCoupling(WithParameters)
/**
 * One thread per cell (1D launch). The cell count is taken from the first
 * entry of lattices. Threads beyond that count or outside of subdomain do
 * nothing; for the remaining cells the operators are tried in order until
 * one returns true.
 **/
template <typename CONTEXTS, typename... OPERATORS>
void call_coupling_operators(CONTEXTS lattices, bool* subdomain, OPERATORS... ops) __global__ {
  const CellID iCell = blockIdx.x * blockDim.x + threadIdx.x;
  const auto cellCount = lattices.template get<0>().getNcells();
  // The bounds test comes first so that subdomain is never read out of range
  if ((iCell < cellCount) && subdomain[iCell]) {
    (ops(lattices, iCell) || ... );
  }
}


/// CUDA kernel for constructing on-device ConcreteDynamics
/**
 * Placement-constructs a ConcreteDynamics<T,DESCRIPTOR,DYNAMICS> at target,
 * passing parameters to its constructor. There is no thread-index guard, so
 * every launched thread performs the construction; setup() in this file
 * launches it as <<<1,1>>>.
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS, typename PARAMETERS=typename DYNAMICS::ParametersD>
void construct_dynamics(void* target, PARAMETERS* parameters) __global__ {
  using dynamics_proxy_t = ConcreteDynamics<T,DESCRIPTOR,DYNAMICS>;
  new (target) dynamics_proxy_t(parameters);
}


}


/// Apply masked collision operators to lattice
/**
 * Launches kernel::call_operators without an explicit stream argument, with
 * 32 threads per block and enough blocks to cover lattice.getNcells() cells,
 * then calls device::check().
 **/
template <typename CONTEXT, typename... ARGS>
void call_operators(CONTEXT& lattice, bool* subdomain, ARGS&&... args) {
  constexpr int threadsPerBlock = 32;
  // Ceiling division: the last block may be only partially used
  const auto nBlocks = (lattice.getNcells() + threadsPerBlock - 1) / threadsPerBlock;
  kernel::call_operators<CONTEXT,ARGS...><<<nBlocks,threadsPerBlock>>>(
    lattice, subdomain, std::forward<ARGS>(args)...);
  device::check();
}


/// Apply masked collision operators to lattice (async)
/**
 * Launches kernel::call_operators on stream, with 32 threads per block and
 * enough blocks to cover lattice.getNcells() cells, then calls device::check().
 **/
template <typename CONTEXT, typename... ARGS>
void async_call_operators(cudaStream_t stream, CONTEXT& lattice, bool* subdomain, ARGS&&... args) {
  constexpr int threadsPerBlock = 32;
  // Ceiling division: the last block may be only partially used
  const auto nBlocks = (lattice.getNcells() + threadsPerBlock - 1) / threadsPerBlock;
  kernel::call_operators<CONTEXT,ARGS...><<<nBlocks,threadsPerBlock,0,stream>>>(
    lattice, subdomain, std::forward<ARGS>(args)...);
  device::check();
}


/// Apply masked collision operators to lattice while tracking statistics
/**
 * Launches kernel::call_operators_with_statistics without an explicit stream
 * argument, with 32 threads per block and enough blocks to cover
 * lattice.getNcells() cells, then calls device::check().
 **/
template <typename CONTEXT, typename... ARGS>
void call_operators_with_statistics(CONTEXT& lattice, bool* subdomain, ARGS&&... args) {
  constexpr int threadsPerBlock = 32;
  // Ceiling division: the last block may be only partially used
  const auto nBlocks = (lattice.getNcells() + threadsPerBlock - 1) / threadsPerBlock;
  kernel::call_operators_with_statistics<CONTEXT,ARGS...><<<nBlocks,threadsPerBlock>>>(
    lattice, subdomain, std::forward<ARGS>(args)...);
  device::check();
}


/// Apply masked collision operators to lattice while tracking statistics (async)
/**
 * Launches kernel::call_operators_with_statistics on stream, with 32 threads
 * per block and enough blocks to cover lattice.getNcells() cells, then calls
 * device::check().
 **/
template <typename CONTEXT, typename... ARGS>
void async_call_operators_with_statistics(cudaStream_t stream, CONTEXT& lattice, bool* subdomain, ARGS&&... args) {
  constexpr int threadsPerBlock = 32;
  // Ceiling division: the last block may be only partially used
  const auto nBlocks = (lattice.getNcells() + threadsPerBlock - 1) / threadsPerBlock;
  kernel::call_operators_with_statistics<CONTEXT,ARGS...><<<nBlocks,threadsPerBlock,0,stream>>>(
    lattice, subdomain, std::forward<ARGS>(args)...);
  device::check();
}


/// Apply operators to listed cell indices
/**
 * Launches kernel::call_list_operators without an explicit stream argument,
 * with 32 threads per block and enough blocks to cover all entries of cells,
 * then calls device::check(). An empty list is a no-op.
 *
 * \param lattice Device-side lattice view handed to the kernel by value
 * \param cells   Column of cell indices; its deviceData() is read by the kernel
 * \param args    Operators forwarded to the kernel
 **/
template <typename CONTEXT, typename... ARGS>
void call_list_operators(CONTEXT& lattice,
                         const gpu::cuda::Column<CellID>& cells,
                         ARGS&&... args) {
  const auto nCells = cells.size();
  // A grid of zero blocks is an invalid launch configuration, so there is
  // nothing to launch (and nothing to do) for an empty list.
  if (nCells == 0) {
    return;
  }
  const auto block_size = 32;
  // Ceiling division: the last block may be only partially used
  const auto block_count = (nCells + block_size - 1) / block_size;
  kernel::call_list_operators<CONTEXT,ARGS...><<<block_count, block_size>>>(
    lattice,
    cells.deviceData(), nCells,
    std::forward<decltype(args)>(args)...);
  device::check();
}


/// Apply operators to listed cell indices (async version)
/**
 * Launches kernel::call_list_operators on stream, with 32 threads per block
 * and enough blocks to cover all entries of cells, then calls
 * device::check(). An empty list is a no-op.
 *
 * \param stream  CUDA stream the kernel is launched on
 * \param lattice Device-side lattice view handed to the kernel by value
 * \param cells   Column of cell indices; its deviceData() is read by the kernel
 * \param args    Operators forwarded to the kernel
 **/
template <typename CONTEXT, typename... ARGS>
void async_call_list_operators(cudaStream_t stream,
                               CONTEXT& lattice,
                               const gpu::cuda::Column<CellID>& cells,
                               ARGS&&... args) {
  const auto nCells = cells.size();
  // A grid of zero blocks is an invalid launch configuration, so there is
  // nothing to launch (and nothing to do) for an empty list.
  if (nCells == 0) {
    return;
  }
  const auto block_size = 32;
  // Ceiling division: the last block may be only partially used
  const auto block_count = (nCells + block_size - 1) / block_size;
  kernel::call_list_operators<<<block_count,block_size,0,stream>>>(
    lattice,
    cells.deviceData(), nCells,
    std::forward<decltype(args)>(args)...);
  device::check();
}


/// Apply ListedCollision with statistics (async version)
/**
 * Launches kernel::call_list_operators_with_statistics on stream, with 32
 * threads per block and enough blocks to cover all entries of cells, then
 * calls device::check(). An empty list is a no-op.
 *
 * \param stream  CUDA stream the kernel is launched on
 * \param lattice Device-side lattice view handed to the kernel by value
 * \param cells   Column of cell indices; its deviceData() is read by the kernel
 * \param args    Operators forwarded to the kernel
 **/
template <typename CONTEXT, typename... ARGS>
void async_call_list_operators_with_statistics(cudaStream_t stream,
                                               CONTEXT& lattice,
                                               const gpu::cuda::Column<CellID>& cells,
                                               ARGS&&... args) {
  const auto nCells = cells.size();
  // A grid of zero blocks is an invalid launch configuration, so there is
  // nothing to launch (and nothing to do) for an empty list.
  if (nCells == 0) {
    return;
  }
  const auto block_size = 32;
  // Ceiling division: the last block may be only partially used
  const auto block_count = (nCells + block_size - 1) / block_size;
  kernel::call_list_operators_with_statistics<<<block_count,block_size,0,stream>>>(
    lattice,
    cells.deviceData(), nCells,
    std::forward<decltype(args)>(args)...);
  device::check();
}


/// Apply coupling on subdomain
/**
 * Launches kernel::call_coupling_operators without an explicit stream
 * argument, with 32 threads per block and enough blocks to cover the cell
 * count of the first lattice in lattices, then calls device::check().
 **/
template <typename CONTEXT, typename... ARGS>
void call_coupling_operators(CONTEXT& lattices, bool* subdomain, ARGS&&... args) {
  const auto cellCount = lattices.template get<0>().getNcells();
  constexpr int threadsPerBlock = 32;
  // Ceiling division: the last block may be only partially used
  const auto nBlocks = (cellCount + threadsPerBlock - 1) / threadsPerBlock;
  kernel::call_coupling_operators<CONTEXT,ARGS...><<<nBlocks,threadsPerBlock>>>(
    lattices, subdomain, std::forward<ARGS>(args)...);
  device::check();
}


}


}


/// Constructs the collision operator in a not-yet-set-up state
/**
 * _parameters and _mask start out as nullptr; they are assigned in setup().
 * _modified starts as true, so the list-based path of applyIndividual()
 * rebuilds _cells from the mask the first time it is taken.
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS>


ConcreteBlockCollisionO<T,DESCRIPTOR,Platform::GPU_CUDA,DYNAMICS>::ConcreteBlockCollisionO():

  _dynamics(new DYNAMICS()),

  _parameters(nullptr),

  _mask(nullptr),

  _cells(0),

  _modified(true),

  _stream(cudaStreamDefault)

{ }


/// Collide block with DYNAMICS as the first operator and dynamic dispatch as the last
/**
 * Cells of subdomain selected by this operator's mask are collided by
 * MaskedCollision<DYNAMICS>; DynamicDispatchCollision is passed as the last
 * operator of the chain. Uses the non-async launch helpers and tracks
 * statistics iff block.statisticsEnabled().
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS>
void ConcreteBlockCollisionO<T,DESCRIPTOR,Platform::GPU_CUDA,DYNAMICS>::applyDominant(
  ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>& block,
  ConcreteBlockMask<T,Platform::GPU_CUDA>&               subdomain)
{
  using namespace gpu::cuda;
  using masked_collision_t = MaskedCollision<T,DESCRIPTOR,DYNAMICS>;

  DeviceContext<T,DESCRIPTOR> context(block);
  if (!block.statisticsEnabled()) {
    call_operators(
      context,
      subdomain.deviceData(),
      masked_collision_t{_parameters->parameters, _mask->deviceData()},
      DynamicDispatchCollision{});
  } else {
    call_operators_with_statistics(
      context,
      subdomain.deviceData(),
      masked_collision_t{_parameters->parameters, _mask->deviceData()},
      DynamicDispatchCollision{});
  }
}


/// Collide only the cells of this operator's DYNAMICS, on this operator's stream
/**
 * Chooses between two dispatch forms:
 *  - mask-based, if this operator's mask weighs more than half of subdomain
 *  - list-based otherwise, using a cell index list rebuilt from the mask
 *    whenever _modified is set
 * Both forms use the async launch helpers with _stream and track statistics
 * iff block.statisticsEnabled().
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS>
void ConcreteBlockCollisionO<T,DESCRIPTOR,Platform::GPU_CUDA,DYNAMICS>::applyIndividual(
  ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>& block,
  ConcreteBlockMask<T,Platform::GPU_CUDA>&               subdomain)
{
  using namespace gpu::cuda;
  using masked_collision_t = MaskedCollision<T,DESCRIPTOR,DYNAMICS>;
  using listed_collision_t = ListedCollision<T,DESCRIPTOR,DYNAMICS>;

  DeviceContext<T,DESCRIPTOR> context(block);

  // Primitive heuristic for preferring mask-based to list-based dispatch
  const bool preferMask = _mask->weight() > 0.5*subdomain.weight();
  if (preferMask) {
    if (block.statisticsEnabled()) {
      async_call_operators_with_statistics(
        _stream.get(),
        context,
        subdomain.deviceData(),
        masked_collision_t{_parameters->parameters, _mask->deviceData()});
    } else {
      async_call_operators(
        _stream.get(),
        context,
        subdomain.deviceData(),
        masked_collision_t{_parameters->parameters, _mask->deviceData()});
    }
    return;
  }

  // Otherwise use a list of cell indices, refreshed from the mask if needed
  if (_modified) {
    _cells.clear();
    const auto nCells = block.getNcells();
    for (CellID iCell=0; iCell < nCells; ++iCell) {
      if ((*_mask)[iCell]) {
        _cells.push_back(iCell);
      }
    }
    _cells.setProcessingContext(ProcessingContext::Simulation);
    _modified = false;
  }

  if (block.statisticsEnabled()) {
    async_call_list_operators_with_statistics(
      _stream.get(),
      context,
      _cells,
      listed_collision_t{_parameters->parameters});
  } else {
    async_call_list_operators(
      _stream.get(),
      context,
      _cells,
      listed_collision_t{_parameters->parameters});
  }
}


/// Bind this operator to block and create its on-device dynamics proxy
/**
 * Stores pointers to the DYNAMICS-specific parameter and mask data of block,
 * allocates device storage for one ConcreteDynamics instance, constructs it
 * there using a single-thread kernel launch and finally fetches the pointer
 * to the on-device dynamic-dispatch field.
 **/
template <typename T, typename DESCRIPTOR, typename DYNAMICS>
void ConcreteBlockCollisionO<T,DESCRIPTOR,Platform::GPU_CUDA,DYNAMICS>::setup(
  ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>& block)
{
  using device_dynamics_t = gpu::cuda::ConcreteDynamics<T,DESCRIPTOR,DYNAMICS>;

  // Fetch pointers to DYNAMICS-specific parameter and mask data
  auto& parameterData = block.template getData<OperatorParameters<DYNAMICS>>();
  _parameters = &parameterData;
  auto& maskData = block.template getData<DynamicsMask<DYNAMICS>>();
  _mask = &maskData;

  // Construct on-device dynamics proxy for dynamic dispatch
  _deviceDynamics = gpu::cuda::device::malloc<device_dynamics_t>(1);
  gpu::cuda::kernel::construct_dynamics<T,DESCRIPTOR,DYNAMICS><<<1,1>>>(
    _deviceDynamics.get(),
    _parameters->deviceData());
  gpu::cuda::device::check();

  // Fetch pointer to on-device dynamic-dispatch field
  _dynamicsOfCells = block.template getField<gpu::cuda::DYNAMICS<T,DESCRIPTOR>>()[0].data();
}


/// Constructs the per-cell operator with _cells(0) and _modified unset
/**
 * _modified is the flag apply() checks before deduplicating the cell list
 * and switching it to the Simulation processing context.
 **/
template <typename T, typename DESCRIPTOR, typename OPERATOR>


ConcreteBlockO<T,DESCRIPTOR,Platform::GPU_CUDA,OPERATOR,OperatorScope::PerCell>::ConcreteBlockO():

  _cells(0),

  _modified{false},

  _stream{cudaStreamDefault}

{ }


/// Apply OPERATOR to all registered cells of block on this operator's stream
/**
 * Does nothing while no cells are registered. If the cell list was modified
 * it is first deduplicated and switched to the Simulation processing
 * context; afterwards OPERATOR is launched for every listed cell.
 **/
template <typename T, typename DESCRIPTOR, typename OPERATOR>
void ConcreteBlockO<T,DESCRIPTOR,Platform::GPU_CUDA,OPERATOR,OperatorScope::PerCell>::apply(
  ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>& block)
{
  if (_cells.size() == 0) {
    return;
  }

  if (_modified) {
    _cells.deduplicate();
    _cells.setProcessingContext(ProcessingContext::Simulation);
    _modified = false;
  }

  gpu::cuda::DeviceBlockLattice<T,DESCRIPTOR> deviceLattice(block);
  gpu::cuda::async_call_list_operators(
    _stream.get(),
    deviceLattice,
    _cells,
    gpu::cuda::ListedPostProcessor<OPERATOR>{});
}


/// Constructs the parametrized per-cell operator with _cells(0) and _modified unset
/**
 * _modified is the flag apply() checks before deduplicating the cell list
 * and switching it to the Simulation processing context.
 **/
template <typename T, typename DESCRIPTOR, typename OPERATOR>


ConcreteBlockO<T,DESCRIPTOR,Platform::GPU_CUDA,OPERATOR,OperatorScope::PerCellWithParameters>::ConcreteBlockO():

  _cells(0),

  _modified{false},

  _stream{cudaStreamDefault}

{ }


/// Apply OPERATOR with its parameters to all registered cells of block
/**
 * Does nothing while no cells are registered. If the cell list was modified
 * it is first deduplicated and switched to the Simulation processing
 * context; afterwards OPERATOR is launched for every listed cell on this
 * operator's stream, receiving a copy of _parameters->parameters.
 **/
template <typename T, typename DESCRIPTOR, typename OPERATOR>
void ConcreteBlockO<T,DESCRIPTOR,Platform::GPU_CUDA,OPERATOR,OperatorScope::PerCellWithParameters>::apply(
  ConcreteBlockLattice<T,DESCRIPTOR,Platform::GPU_CUDA>& block)
{
  if (_cells.size() == 0) {
    return;
  }

  if (_modified) {
    _cells.deduplicate();
    _cells.setProcessingContext(ProcessingContext::Simulation);
    _modified = false;
  }

  gpu::cuda::DeviceBlockLattice<T,DESCRIPTOR> deviceLattice(block);
  gpu::cuda::async_call_list_operators(
    _stream.get(),
    deviceLattice,
    _cells,
    gpu::cuda::ListedPostProcessorWithParameters<T,DESCRIPTOR,OPERATOR>{_parameters->parameters});
}


/// Set whether the coupling is applied to cell iCell
/**
 * On first use a coupling-specific mask is created from the
 * CollisionSubdomainMask data of the first coupled lattice; afterwards the
 * entry for iCell is set to state.
 **/
template <typename COUPLER, typename COUPLEES>
void ConcreteBlockCouplingO<COUPLEES,Platform::GPU_CUDA,COUPLER,OperatorScope::PerCell>::set(
  CellID iCell, bool state)
{
  using first_value_t   = typename COUPLEES::values_t::template get<0>::value_t;
  using coupling_mask_t = ConcreteBlockMask<first_value_t,Platform::GPU_CUDA>;

  if (!_mask) {
    // Lazily create the mask from the first lattice's collision subdomain
    _mask = std::make_unique<coupling_mask_t>(
      _lattices.template get<0>()->template getData<CollisionSubdomainMask>());
  }
  _mask->set(iCell, state);
}


/// Execute COUPLER on the coupled lattices
/**
 * Wraps every coupled lattice in a DeviceBlockLattice and launches the
 * coupling kernel. If a coupling-specific mask exists it is switched to the
 * Simulation processing context and used as the subdomain; otherwise the
 * CollisionSubdomainMask data of the first lattice is used.
 **/
template <typename COUPLER, typename COUPLEES>
void ConcreteBlockCouplingO<COUPLEES,Platform::GPU_CUDA,COUPLER,OperatorScope::PerCell>::execute()
{
  auto deviceLattices = _lattices.exchange_values([&](auto key) {
    return gpu::cuda::DeviceBlockLattice{*_lattices.get(key)};
  });

  if (!_mask) {
    // No coupling-specific mask was set: fall back to the first lattice's subdomain
    auto& fallback = _lattices.template get<0>()->template getData<CollisionSubdomainMask>();
    gpu::cuda::call_coupling_operators(
      deviceLattices, fallback.deviceData(),
      gpu::cuda::UnmaskedCoupling<COUPLER>{});
    return;
  }

  _mask->setProcessingContext(ProcessingContext::Simulation);
  gpu::cuda::call_coupling_operators(
    deviceLattices, _mask->deviceData(),
    gpu::cuda::UnmaskedCoupling<COUPLER>{});
}


/// Set whether the parametrized coupling is applied to cell iCell
/**
 * On first use a coupling-specific mask is created from the
 * CollisionSubdomainMask data of the first coupled lattice; afterwards the
 * entry for iCell is set to state.
 **/
template <typename COUPLER, typename COUPLEES>
void ConcreteBlockCouplingO<COUPLEES,Platform::GPU_CUDA,COUPLER,OperatorScope::PerCellWithParameters>::set(
  CellID iCell, bool state)
{
  using first_value_t   = typename COUPLEES::values_t::template get<0>::value_t;
  using coupling_mask_t = ConcreteBlockMask<first_value_t,Platform::GPU_CUDA>;

  if (!_mask) {
    // Lazily create the mask from the first lattice's collision subdomain
    _mask = std::make_unique<coupling_mask_t>(
      _lattices.template get<0>()->template getData<CollisionSubdomainMask>());
  }
  _mask->set(iCell, state);
}


/// Execute COUPLER with its parameters on the coupled lattices
/**
 * Wraps every coupled lattice in a DeviceBlockLattice and launches the
 * coupling kernel with an operator built from _parameters. If a
 * coupling-specific mask exists it is switched to the Simulation processing
 * context and used as the subdomain; otherwise the CollisionSubdomainMask
 * data of the first lattice is used.
 **/
template <typename COUPLER, typename COUPLEES>
void ConcreteBlockCouplingO<COUPLEES,Platform::GPU_CUDA,COUPLER,OperatorScope::PerCellWithParameters>::execute()
{
  using coupling_t = gpu::cuda::UnmaskedCouplingWithParameters<COUPLER,COUPLEES>;

  auto deviceLattices = _lattices.exchange_values([&](auto key) {
    return gpu::cuda::DeviceBlockLattice{*_lattices.get(key)};
  });

  if (!_mask) {
    // No coupling-specific mask was set: fall back to the first lattice's subdomain
    auto& fallback = _lattices.template get<0>()->template getData<CollisionSubdomainMask>();
    gpu::cuda::call_coupling_operators(
      deviceLattices, fallback.deviceData(),
      coupling_t{_parameters});
    return;
  }

  _mask->setProcessingContext(ProcessingContext::Simulation);
  gpu::cuda::call_coupling_operators(
    deviceLattices, _mask->deviceData(),
    coupling_t{_parameters});
}


}


#endif

olb::BlockLattice::statisticsEnabled
bool statisticsEnabled() const
Definition blockLattice.h:210

olb::ConcreteBlockCollisionO
Collision operation of concrete DYNAMICS on concrete block lattices of PLATFORM.
Definition blockDynamicsMap.h:40

olb::ConcreteBlockCouplingO
Coupling of COUPLEES using concrete OPERATOR with SCOPE on PLATFORM lattices.
Definition operator.h:142

olb::ConcreteBlockLattice
Implementation of BlockLattice on a concrete PLATFORM.
Definition blockLattice.h:464

olb::ConcreteBlockMask
Definition blockDynamicsMap.h:39

olb::ConcreteBlockO
Block application of concrete OPERATOR called using SCOPE on PLATFORM.
Definition operator.h:65

olb::gpu::cuda::Cell
Device-side implementation of the Cell concept for post processors.
Definition context.hh:248

olb::gpu::cuda::Column
Plain column for CUDA GPU targets.
Definition column.h:49

olb::gpu::cuda::Column::deviceData
const T * deviceData() const
Definition column.hh:146

olb::gpu::cuda::Column::size
std::size_t size() const
Definition column.hh:128

olb::gpu::cuda::ConcreteDynamics
Implementation of gpu::cuda::Dynamics for concrete DYNAMICS.
Definition dynamics.hh:81

olb::gpu::cuda::DataOnlyCell
Device-side implementation of the data-only Cell concept for collision steps.
Definition context.hh:140

olb::gpu::cuda::DeviceBlockLattice
Device-side view of a block lattice.
Definition context.hh:207

olb::gpu::cuda::DeviceBlockLattice::get
Cell< T, DESCRIPTOR > get(CellID iCell) __device__
Definition context.hh:233

olb::gpu::cuda::DeviceContext
Structure for passing pointers to on-device data into CUDA kernels.
Definition context.hh:55

olb::gpu::cuda::ListedCollision
List-based application of DYNAMICS::apply for use in kernel::call_list_operators.
Definition operator.hh:93

olb::gpu::cuda::ListedCollision::operator()
bool operator()(DeviceContext< T, DESCRIPTOR > &lattice, CellID iCell) __device__
Definition operator.hh:102

olb::gpu::cuda::ListedCollision::operator()
bool operator()(DeviceContext< T, DESCRIPTOR > &lattice, CellID iCell, CellStatistic< T > &statistic) __device__
Definition operator.hh:108

olb::gpu::cuda::ListedCollision::ListedCollision
ListedCollision(ParametersOfOperatorD< T, DESCRIPTOR, DYNAMICS > &parameters) __host__
Definition operator.hh:98

olb::gpu::cuda::ListedPostProcessorWithParameters
List-based application of OPERATOR::apply with parameters.
Definition operator.hh:158

olb::gpu::cuda::ListedPostProcessorWithParameters::operator()
bool operator()(DeviceBlockLattice< T, DESCRIPTOR > &lattice, CellID iCell) __device__
Definition operator.hh:167

olb::gpu::cuda::ListedPostProcessorWithParameters::ListedPostProcessorWithParameters
ListedPostProcessorWithParameters(ParametersOfOperatorD< T, DESCRIPTOR, OPERATOR > &parameters) __host__
Definition operator.hh:163

olb::gpu::cuda::MaskedCollision
Masked application of DYNAMICS::apply for use in kernel::call_operators.
Definition operator.hh:45

olb::gpu::cuda::MaskedCollision::operator()
bool operator()(DeviceContext< T, DESCRIPTOR > &lattice, CellID iCell) __device__
Chainable call operator for use in kernel::call_operators.
Definition operator.hh:72

olb::gpu::cuda::MaskedCollision::MaskedCollision
MaskedCollision(ParametersOfOperatorD< T, DESCRIPTOR, DYNAMICS > &parameters, bool *mask) any_platform
Constructor (commonly called on the host side)
Definition operator.hh:62

olb::gpu::cuda::MaskedCollision::operator()
bool operator()(DeviceContext< T, DESCRIPTOR > &lattice, CellID iCell, CellStatistic< T > &statistic) __device__
Chainable call operator with statistics storage.
Definition operator.hh:81

olb::gpu::cuda::MaskedPostProcessor
Masked application of OPERATOR::apply.
Definition operator.hh:119

olb::gpu::cuda::MaskedPostProcessor::MaskedPostProcessor
MaskedPostProcessor(bool *mask) any_platform
Definition operator.hh:125

olb::gpu::cuda::MaskedPostProcessor::operator()
bool operator()(DeviceBlockLattice< T, DESCRIPTOR > &lattice, CellID iCell) __device__
Definition operator.hh:130

olb::gpu::cuda::UnmaskedCouplingWithParameters
Unrestricted application of COUPLING::apply with parameters.
Definition operator.hh:191

olb::gpu::cuda::UnmaskedCouplingWithParameters::operator()
bool operator()(CONTEXT &lattices, CellID iCell) __device__
Definition operator.hh:204

olb::gpu::cuda::UnmaskedCouplingWithParameters::UnmaskedCouplingWithParameters
UnmaskedCouplingWithParameters(PARAMETERS &parameters) any_platform
Definition operator.hh:199

context.hh

dynamics.hh

olb::gpu::cuda::device::check
void check()
Check errors.
Definition device.hh:48

olb::gpu::cuda::kernel::call_coupling_operators
void call_coupling_operators(CONTEXTS lattices, bool *subdomain, OPERATORS... ops) __global__
CUDA kernel for applying UnmaskedCoupling(WithParameters)
Definition operator.hh:341

olb::gpu::cuda::kernel::call_list_operators
void call_list_operators(CONTEXT lattice, const CellID *indices, std::size_t nIndices, OPERATORS... ops) __global__
CUDA kernel for applying generic OPERATORS with OperatorScope::PerCell or ListedCollision.
Definition operator.hh:301

olb::gpu::cuda::kernel::construct_dynamics
void construct_dynamics(void *target, PARAMETERS *parameters) __global__
CUDA kernel for constructing on-device ConcreteDynamics.
Definition operator.hh:352

olb::gpu::cuda::kernel::call_operators
void call_operators(CONTEXT lattice, bool *subdomain, OPERATORS... ops) __global__
CUDA kernel for applying purely local collision steps.
Definition operator.hh:265

olb::gpu::cuda::kernel::call_list_operators_with_statistics
void call_list_operators_with_statistics(CONTEXT lattice, const CellID *indices, std::size_t nIndices, OPERATORS... ops) __global__
CUDA kernel for applying ListedCollision.
Definition operator.hh:316

olb::gpu::cuda::kernel::call_operators_with_statistics
void call_operators_with_statistics(CONTEXT lattice, bool *subdomain, OPERATORS... ops) __global__
CUDA kernel for applying purely local collision steps while tracking statistics.
Definition operator.hh:278

olb::gpu::cuda::async_call_list_operators
void async_call_list_operators(cudaStream_t stream, CONTEXT &lattice, const gpu::cuda::Column< CellID > &cells, ARGS &&... args)
Apply operators to listed cell indices (async version)
Definition operator.hh:423

olb::gpu::cuda::async_call_operators
void async_call_operators(cudaStream_t stream, CONTEXT &lattice, bool *subdomain, ARGS &&... args)
Apply masked collision operators to lattice (async)
Definition operator.hh:373

olb::gpu::cuda::call_operators
void call_operators(CONTEXT &lattice, bool *subdomain, ARGS &&... args)
Apply masked collision operators to lattice.
Definition operator.hh:363

olb::gpu::cuda::async_call_list_operators_with_statistics
void async_call_list_operators_with_statistics(cudaStream_t stream, CONTEXT &lattice, const gpu::cuda::Column< CellID > &cells, ARGS &&... args)
Apply ListedCollision with statistics (async version)
Definition operator.hh:438

olb::gpu::cuda::async_call_operators_with_statistics
void async_call_operators_with_statistics(cudaStream_t stream, CONTEXT &lattice, bool *subdomain, ARGS &&... args)
Apply masked collision operators to lattice while tracking statistics (async)
Definition operator.hh:396

olb::gpu::cuda::call_list_operators
void call_list_operators(CONTEXT &lattice, const gpu::cuda::Column< CellID > &cells, ARGS &&... args)
Apply operators to listed cell indices.
Definition operator.hh:409

olb::gpu::cuda::getFusedCollisionO
std::function< void(ConcreteBlockLattice< T, DESCRIPTOR, Platform::GPU_CUDA > &)> getFusedCollisionO()
Helper for constructing fused collision operators.
Definition operator.hh:233

olb::gpu::cuda::call_operators_with_statistics
void call_operators_with_statistics(CONTEXT &lattice, bool *subdomain, ARGS &&... args)
Apply masked collision operators to lattice while tracking statistics.
Definition operator.hh:386

olb::gpu::cuda::call_coupling_operators
void call_coupling_operators(CONTEXT &lattices, bool *subdomain, ARGS &&... args)
Apply coupling on subdomain.
Definition operator.hh:453

olb
Top level namespace for all of OpenLB.
Definition boundaryPostProcessors2D.h:34

olb::CellID
std::uint32_t CellID
Type for sequential block-local cell indices.
Definition blockStructure.h:36

olb::ProcessingContext::Simulation
@ Simulation
Data available on device for evaluating the local simulation.

olb::Platform::GPU_CUDA
@ GPU_CUDA
GPU platform using CUDA.

olb::ParametersOfOperatorD
typename ParametersD< T, DESCRIPTOR >::template include< typename OPERATOR::parameters > ParametersOfOperatorD
Deduce ParametersD of OPERATOR w.r.t. T and DESCRIPTOR.
Definition fieldParametersD.h:184

operator.h

any_platform
#define any_platform
Define preprocessor macros for device-side functions, constant storage.
Definition platform.h:78

olb::AbstractCouplingO
Base of block-wide coupling operators executed by SuperLatticeCoupling.
Definition operator.h:115

olb::CellStatistic
Return value of any collision.
Definition interface.h:43

olb::CellStatistic::rho
T rho
Definition interface.h:44

olb::DynamicsMask
Describe mask of DYNAMICS in Data.
Definition data.h:62

olb::gpu::cuda::DYNAMICS
On-device field mirroring BlockDynamicsMap.
Definition dynamics.h:39

olb::gpu::cuda::DynamicDispatchCollision
Last node in a MaskedDynamics chain in kernel::call_operators.
Definition dynamics.hh:148

olb::gpu::cuda::ListedPostProcessor
List-based application of OPERATOR::apply.
Definition operator.hh:146

olb::gpu::cuda::ListedPostProcessor::operator()
bool operator()(DeviceBlockLattice< T, DESCRIPTOR > &lattice, CellID iCell) __device__
Definition operator.hh:148

olb::gpu::cuda::UnmaskedCoupling
Unrestricted application of COUPLING::apply.
Definition operator.hh:177

olb::gpu::cuda::UnmaskedCoupling::operator()
bool operator()(CONTEXT &lattices, CellID iCell) __device__
Definition operator.hh:179