openmp__cuda_8h_source.html

/*

 *            Copyright 2009-2020 The VOTCA Development Team

 *                       (http://www.votca.org)

 *

 *      Licensed under the Apache License, Version 2.0 (the "License")

 *

 * You may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *              http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 *

 */


#pragma once

#ifndef VOTCA_XTP_OPENMP_CUDA_H

#define VOTCA_XTP_OPENMP_CUDA_H


// Local VOTCA includes

#include "eigen.h"


#ifdef USE_CUDA

#include "cudapipeline.h"

#endif


namespace votca {

namespace xtp {


// Declares the bookkeeping used to run matrix operations from OpenMP threads
// and, when compiled with USE_CUDA, on CUDA devices.
//
// Only declarations are visible in this header; the member functions are
// defined in the corresponding source file. The short group labels below
// ("3c", "RPA", ...) are kept from the original author.
//
// Lifetime note: the setOperators()/createTemporaries() overloads take their
// arguments by const reference and the class keeps non-owning handles
// (rOP_, lOP_, vec_) of matching types. Presumably those handles are bound to
// the passed-in objects, so callers should keep them alive while the
// OpenMP_CUDA object is in use -- TODO confirm against the implementation.
class OpenMP_CUDA {
 public:
  OpenMP_CUDA();

  // Static GPU configuration; see number_of_gpus below.
  static Index UsingGPUs();
  static Index AvailableGPUs();
  static void SetNoGPUs(Index number);

  // 3c multiply
  void setOperators(const std::vector<Eigen::MatrixXd>& tensor,
                    const Eigen::MatrixXd& rightoperator);
  void MultiplyRight(Eigen::MatrixXd& matrix, Index OpenmpThread);

  // 3c
  void setOperators(const Eigen::MatrixXd& leftoperator,
                    const Eigen::MatrixXd& rightoperator);
  void MultiplyLeftRight(Eigen::MatrixXd& matrix, Index OpenmpThread);

  // RPA
  void createTemporaries(Index rows, Index cols);
  void PushMatrix(const Eigen::MatrixXd& mat, Index OpenmpThread);
  void A_TDA(const Eigen::VectorXd& vec, Index OpenmpThread);

  // Hd + Hqp + Hd2
  void createTemporaries(const Eigen::VectorXd& vec,
                         const Eigen::MatrixXd& input, Index rows1, Index rows2,
                         Index cols);
  void PrepareMatrix1(Eigen::MatrixXd& mat, Index OpenmpThread);
  void SetTempZero(Index OpenmpThread);
  void PrepareMatrix2(const Eigen::Block<const Eigen::MatrixXd>& mat, bool Hd2,
                      Index OpenmpThread);
  void Addvec(const Eigen::VectorXd& row, Index OpenmpThread);
  void MultiplyRow(Index row, Index OpenmpThread);

  // Hx
  void createAdditionalTemporaries(Index rows, Index cols);
  void PushMatrix1(const Eigen::MatrixXd& mat, Index OpenmpThread);
  void MultiplyBlocks(const Eigen::Block<const Eigen::MatrixXd>& mat, Index i1,
                      Index i2, Index OpenmpThread);

  // Returns the reduction result by value.
  Eigen::MatrixXd getReductionVar();

 private:
  // Rebindable, non-owning handle to an object of type T.
  //
  // A default-constructed handle is unbound (null). Binding stores the
  // address of the referenced object; the object is never copied, so it must
  // outlive every call to operator()().
  template <class T>
  class DefaultReference {
   public:
    DefaultReference() = default;

    // Binds to `object`. The argument is taken by const reference so that the
    // stored address is that of the caller's object. (Taking it by value, as
    // was done previously, stored the address of the parameter copy, which is
    // destroyed when the constructor returns.)
    DefaultReference(const T& object) : p(&object) {}

    // Rebinds the handle to `object`.
    DefaultReference& operator=(const T& object) {
      p = &object;
      return *this;
    }

    // Returns the bound object; asserts that the handle has been bound.
    const T& operator()() const {
      assert(p != nullptr && "Dangling reference!");
      return *p;
    }

   private:
    const T* p = nullptr;
  };

  DefaultReference<const Eigen::MatrixXd> rOP_;
  DefaultReference<const Eigen::MatrixXd> lOP_;
  DefaultReference<const Eigen::VectorXd> vec_;

  // Host-side scratch storage; one instance per entry of cpus_.
  struct CPU_data {

    // Mutable access to the reduction matrix.
    Eigen::MatrixXd& reduce() { return reduce_mat; }

    // Replaces the reduction matrix with a rows x cols zero matrix.
    void InitializeReduce(Index rows, Index cols) {
      reduce_mat = Eigen::MatrixXd::Zero(rows, cols);
    }

    // Replaces the temporary vector with a zero vector of length `size`.
    void InitializeVec(Index size) { temp_vec = Eigen::VectorXd::Zero(size); }

    DefaultReference<Eigen::MatrixXd> ref_mat;
    Eigen::MatrixXd temp_mat;
    Eigen::VectorXd temp_vec;
    Eigen::MatrixXd reduce_mat;
  };

  // Presumably one entry per CPU worker thread -- TODO confirm in the
  // implementation.
  std::vector<CPU_data> cpus_;

  // Both members have no in-class initializer; they are expected to be set by
  // the constructor, which is defined outside this header.
  bool inside_Parallel_region_;
  Index threadID_parent_;

  static Index number_of_gpus;

  Index getParentThreadId(Index OpenmpThreadId) const;

  Index getLocalThreadId(Index ParentThreadId) const;

  Index getNumberThreads() const;

#ifdef USE_CUDA
  bool isGPUthread(Index ParentThreadId) const;

  // Per-device state: a CudaPipeline plus a list of owned CudaMatrix objects.
  struct GPU_data {

    // Creates the pipeline for device `i`; the id is narrowed to int because
    // that is what the CudaPipeline constructor is called with.
    explicit GPU_data(Index i)
        : Id(i), pipeline(std::make_unique<CudaPipeline>(static_cast<int>(i))) {}

    Index Id;
    std::unique_ptr<CudaPipeline> pipeline;
    std::vector<std::unique_ptr<CudaMatrix>> temp;

    // Unchecked access to the i-th stored matrix.
    CudaMatrix& Mat(Index i) { return *temp[i]; }
    CudaPipeline& pipe() { return *pipeline; }

    // Calls cudaSetDevice with this pipeline's device id; the result is
    // passed to checkCuda.
    void activateGPU() { checkCuda(cudaSetDevice(pipeline->getDeviceId())); }

    // Appends a CudaMatrix constructed from `m` on the pipeline's stream.
    void push_back(const Eigen::MatrixXd& m) {
      temp.push_back(std::make_unique<CudaMatrix>(m, pipeline->get_stream()));
    }

    // Appends a rows x cols CudaMatrix created on the pipeline's stream.
    void push_back(Index rows, Index cols) {
      temp.push_back(
          std::make_unique<CudaMatrix>(rows, cols, pipeline->get_stream()));
    }

    // Replaces slot `id` with a freshly constructed rows x cols CudaMatrix;
    // the previously stored matrix is destroyed. `id` must be a valid index.
    void resize(Index id, Index rows, Index cols) {
      temp[id] =
          std::make_unique<CudaMatrix>(rows, cols, pipeline->get_stream());
    }
  };

  std::vector<GPU_data> gpus_;
  static bool isInVector(Index Id, const std::vector<GPU_data>& vec);
#endif
};


}  // namespace xtp

}  // namespace votca


#endif  // VOTCA_XTP_OPENMP_CUDA_H

votca::xtp::CudaMatrix
Definition cudamatrix.h:104

votca::xtp::CudaPipeline
Definition cudapipeline.h:48

votca::xtp::OpenMP_CUDA::DefaultReference
Definition openmp_cuda.h:111

votca::xtp::OpenMP_CUDA::DefaultReference::operator()
const T & operator()()
Definition openmp_cuda.h:121

votca::xtp::OpenMP_CUDA::DefaultReference::p
const T * p
Definition openmp_cuda.h:127

votca::xtp::OpenMP_CUDA::DefaultReference::operator=
DefaultReference & operator=(const T &object)
Definition openmp_cuda.h:116

votca::xtp::OpenMP_CUDA::DefaultReference::DefaultReference
DefaultReference()=default

votca::xtp::OpenMP_CUDA::DefaultReference::DefaultReference
DefaultReference(T object)
Definition openmp_cuda.h:114

votca::xtp::OpenMP_CUDA::A_TDA
void A_TDA(const Eigen::VectorXd &vec, Index OpenmpThread)
Definition openmp_cuda.cc:235

votca::xtp::OpenMP_CUDA::Addvec
void Addvec(const Eigen::VectorXd &row, Index OpenmpThread)
Definition openmp_cuda.cc:371

votca::xtp::OpenMP_CUDA::getParentThreadId
Index getParentThreadId(Index OpenmpThreadId) const
Definition openmp_cuda.cc:106

votca::xtp::OpenMP_CUDA::PushMatrix1
void PushMatrix1(const Eigen::MatrixXd &mat, Index OpenmpThread)
Definition openmp_cuda.cc:425

votca::xtp::OpenMP_CUDA::MultiplyLeftRight
void MultiplyLeftRight(Eigen::MatrixXd &matrix, Index OpenmpThread)
Definition openmp_cuda.cc:189

votca::xtp::OpenMP_CUDA::cpus_
std::vector< CPU_data > cpus_
Definition openmp_cuda.h:149

votca::xtp::OpenMP_CUDA::getReductionVar
Eigen::MatrixXd getReductionVar()
Definition openmp_cuda.cc:480

votca::xtp::OpenMP_CUDA::SetTempZero
void SetTempZero(Index OpenmpThread)
Definition openmp_cuda.cc:318

votca::xtp::OpenMP_CUDA::MultiplyRight
void MultiplyRight(Eigen::MatrixXd &matrix, Index OpenmpThread)
Definition openmp_cuda.cc:147

votca::xtp::OpenMP_CUDA::createTemporaries
void createTemporaries(Index rows, Index cols)
Definition openmp_cuda.cc:212

votca::xtp::OpenMP_CUDA::setOperators
void setOperators(const std::vector< Eigen::MatrixXd > &tensor, const Eigen::MatrixXd &rightoperator)
Definition openmp_cuda.cc:89

votca::xtp::OpenMP_CUDA::PushMatrix
void PushMatrix(const Eigen::MatrixXd &mat, Index OpenmpThread)
Definition openmp_cuda.cc:218

votca::xtp::OpenMP_CUDA::MultiplyBlocks
void MultiplyBlocks(const Eigen::Block< const Eigen::MatrixXd > &mat, Index i1, Index i2, Index OpenmpThread)
Definition openmp_cuda.cc:442

votca::xtp::OpenMP_CUDA::AvailableGPUs
static Index AvailableGPUs()
Definition openmp_cuda.cc:32

votca::xtp::OpenMP_CUDA::OpenMP_CUDA
OpenMP_CUDA()
Definition openmp_cuda.cc:48

votca::xtp::OpenMP_CUDA::MultiplyRow
void MultiplyRow(Index row, Index OpenmpThread)
Definition openmp_cuda.cc:388

votca::xtp::OpenMP_CUDA::inside_Parallel_region_
bool inside_Parallel_region_
Definition openmp_cuda.h:151

votca::xtp::OpenMP_CUDA::createAdditionalTemporaries
void createAdditionalTemporaries(Index rows, Index cols)
Definition openmp_cuda.cc:422

votca::xtp::OpenMP_CUDA::PrepareMatrix2
void PrepareMatrix2(const Eigen::Block< const Eigen::MatrixXd > &mat, bool Hd2, Index OpenmpThread)
Definition openmp_cuda.cc:334

votca::xtp::OpenMP_CUDA::SetNoGPUs
static void SetNoGPUs(Index number)
Definition openmp_cuda.cc:40

votca::xtp::OpenMP_CUDA::threadID_parent_
Index threadID_parent_
Definition openmp_cuda.h:152

votca::xtp::OpenMP_CUDA::getLocalThreadId
Index getLocalThreadId(Index ParentThreadId) const
Definition openmp_cuda.cc:109

votca::xtp::OpenMP_CUDA::UsingGPUs
static Index UsingGPUs()
Definition openmp_cuda.cc:30

votca::xtp::OpenMP_CUDA::rOP_
DefaultReference< const Eigen::MatrixXd > rOP_
Definition openmp_cuda.h:130

votca::xtp::OpenMP_CUDA::lOP_
DefaultReference< const Eigen::MatrixXd > lOP_
Definition openmp_cuda.h:131

votca::xtp::OpenMP_CUDA::number_of_gpus
static Index number_of_gpus
Definition openmp_cuda.h:154

votca::xtp::OpenMP_CUDA::getNumberThreads
Index getNumberThreads() const
Definition openmp_cuda.cc:112

votca::xtp::OpenMP_CUDA::vec_
DefaultReference< const Eigen::VectorXd > vec_
Definition openmp_cuda.h:132

votca::xtp::OpenMP_CUDA::PrepareMatrix1
void PrepareMatrix1(Eigen::MatrixXd &mat, Index OpenmpThread)
Definition openmp_cuda.cc:299

cudapipeline.h

std
STL namespace.

votca
base class for all analysis tools
Definition basebead.h:33

votca::Index
Eigen::Index Index
Definition types.h:26

votca::xtp::OpenMP_CUDA::CPU_data
Definition openmp_cuda.h:134

votca::xtp::OpenMP_CUDA::CPU_data::ref_mat
DefaultReference< Eigen::MatrixXd > ref_mat
Definition openmp_cuda.h:143

votca::xtp::OpenMP_CUDA::CPU_data::reduce
Eigen::MatrixXd & reduce()
Definition openmp_cuda.h:136

votca::xtp::OpenMP_CUDA::CPU_data::temp_mat
Eigen::MatrixXd temp_mat
Definition openmp_cuda.h:144

votca::xtp::OpenMP_CUDA::CPU_data::temp_vec
Eigen::VectorXd temp_vec
Definition openmp_cuda.h:145

votca::xtp::OpenMP_CUDA::CPU_data::reduce_mat
Eigen::MatrixXd reduce_mat
Definition openmp_cuda.h:146

votca::xtp::OpenMP_CUDA::CPU_data::InitializeReduce
void InitializeReduce(Index rows, Index cols)
Definition openmp_cuda.h:137

votca::xtp::OpenMP_CUDA::CPU_data::InitializeVec
void InitializeVec(Index size)
Definition openmp_cuda.h:141

eigen.h