openCARP
Doxygen code documentation for the open cardiac electrophysiology simulator openCARP
target.h
Go to the documentation of this file.
1 // ----------------------------------------------------------------------------
2 // openCARP is an open cardiac electrophysiology simulator.
3 //
4 // Copyright (C) 2020 openCARP project
5 //
6 // This program is licensed under the openCARP Academic Public License (APL)
7 // v1.0: You can use and redistribute it and/or modify it in non-commercial
8 // academic environments under the terms of APL as published by the openCARP
9 // project v1.0, or (at your option) any later version. Commercial use requires
10 // a commercial license (info@opencarp.org).
11 //
12 // This program is distributed without any warranty; see the openCARP APL for
13 // more details.
14 //
15 // You should have received a copy of the openCARP APL along with this program
16 // and can find it online: http://www.opencarp.org/license
17 // ----------------------------------------------------------------------------
18 
25 #ifndef TARGETS_H
26 #define TARGETS_H
27 
#include <cstddef>
#include <cstring>
#include <iostream>
#include <memory>
#include <stdexcept>
#include <string>
#include <type_traits>
#ifdef HAS_ROCM_MODEL
#include <hip/hip_runtime.h>
#endif
#ifdef HAS_CUDA_MODEL
#include <cuda_runtime.h>
#endif
38 
39 namespace limpet
40 {
41 
/**
 * @brief Enum that represents the different targets to run ionic models on.
 *
 * Negative values are sentinels; the non-negative values are the concrete
 * targets, with N_TARGETS acting as a count/end marker (so it must stay last).
 */
enum Target {
  AUTO = -2,    //!< special value for choosing the target automatically
  UNKNOWN = -1, //!< special value to handle unknown targets
  CPU,          //!< baseline CPU model generated with the original openCARP code generator
  MLIR_CPU,     //!< vectorized CPU code generated with MLIR
  MLIR_ROCM,    //!< ROCM code for AMD GPUs generated with MLIR
  MLIR_CUDA,    //!< CUDA code for NVIDIA GPUs generated with MLIR
  N_TARGETS     //!< a token to indicate the maximum number of targets
};
54 
62 Target get_target_from_string(std::string const str);
63 
71 std::string get_string_from_target(Target const target);
72 
77 std::string get_target_list_string();
78 
84 bool is_gpu(Target const target);
85 
94 bool is_concrete(Target const target);
95 
103 template <typename T>
105  typedef T value_type;
106 
114  TargetAllocator(Target target, bool always_managed = false) : _target(target), _always_managed(always_managed) {
115  if (!is_concrete(target)) {
116  throw std::invalid_argument("attempting to construct a TargetAllocator with an invalid target");
117  }
118  }
119 
125  Target get_target() const {
126  return this->_target;
127  }
128 
134  void set_target(Target new_target) {
135  if (!is_concrete(new_target)) {
136  throw std::invalid_argument("attempting to set TargetAllocator to an invalid target");
137  }
138  else {
139  this->_target = new_target;
140  }
141  }
142 
154  T* allocate(std::size_t n, bool do_zero = true) {
155  using type = typename std::conditional<std::is_void<T>::value, char, T>::type;
156  T* ptr = nullptr;
157  std::size_t n_bytes = n * sizeof(type);
158  switch (this->_target) {
159  case Target::MLIR_CPU:
160  case Target::CPU: {
161  std::allocator<type> std_alloc;
162  if(n)
163  {
164  ptr = std_alloc.allocate(n);
165  // Explicitely cast the pointer to silence warning on setting a
166  // dynamic class object to 0.
167  // The memory allocated by this function should be initialized after,
168  // for example by using a placement new
169  if(do_zero)
170  std::memset((void *) ptr, 0, n_bytes);
171  }
172 
173 
174  break;
175  }
176  case Target::MLIR_ROCM:
177 #ifdef HAS_ROCM_MODEL
178  {
179  T* hip_ptr;
180  hipError_t error;
181  // Force usage of HIP managed memory even if it's not supported.
182  // This should still preserve the semantics of managed memory, but
183  // is slower. It can be useful to allocate small shared data between CPU
184  // and GPU.
185  if (this->_always_managed) {
186  error = hipMallocManaged(&hip_ptr, n_bytes);
187  }
188  else {
189  int device;
190  int managed_memory = 0;
191  hipGetDevice(&device);
192  hipDeviceGetAttribute(&managed_memory, hipDeviceAttributeManagedMemory, device);
193  // Check for HIP managed memory and fallback to a normal hipMalloc if
194  // it's not supported. It should still allow the CPU to write to GPU memory.
195  if (managed_memory) {
196  error = hipMallocManaged(&hip_ptr, n_bytes);
197  }
198  else {
199  error = hipMalloc(&hip_ptr, n_bytes);
200  }
201  }
202  if (error != hipSuccess) {
203  throw std::runtime_error(hipGetErrorString(error));
204  }
205  error = hipMemset(hip_ptr, 0, n_bytes);
206  if (error != hipSuccess) {
207  throw std::runtime_error(hipGetErrorString(error));
208  }
209  ptr = hip_ptr;
210  }
211 #else
212  throw std::invalid_argument("target MLIR_ROCM is unavailable");
213 #endif
214  break;
215  case Target::MLIR_CUDA:
216 #ifdef HAS_CUDA_MODEL
217  {
218  T* cuda_ptr;
219  cudaError_t error;
220  // Always use unified memory for CUDA
221  error = cudaMallocManaged(&cuda_ptr, n_bytes);
222  if (error != cudaSuccess) {
223  throw std::runtime_error(cudaGetErrorString(error));
224  }
225  error = cudaMemset(cuda_ptr, 0, n_bytes);
226  if (error != cudaSuccess) {
227  throw std::runtime_error(cudaGetErrorString(error));
228  }
229  ptr = cuda_ptr;
230  }
231 #else
232  throw std::invalid_argument("target MLIR_CUDA is unavailable");
233 #endif
234  break;
235  default:
236  throw std::invalid_argument("unknown allocation target");
237  }
238  return ptr;
239  }
240 
241  // Size is not needed
250  void deallocate(T* ptr, std::size_t n = 0) {
251  using type = typename std::conditional<std::is_void<T>::value, char, T>::type;
252  switch (this->_target) {
253  case Target::MLIR_CPU:
254  case Target::CPU: {
255  std::allocator<type> std_alloc;
256  std_alloc.deallocate((type*) ptr, n);
257  }
258  break;
259  case Target::MLIR_ROCM:
260 #ifdef HAS_ROCM_MODEL
261  {
262  hipError_t error;
263  error = hipFree(ptr);
264  if (error != hipSuccess) {
265  throw std::runtime_error(hipGetErrorString(error));
266  }
267  }
268 #else
269  throw std::invalid_argument("target MLIR_ROCM is unavailable");
270 #endif
271  break;
272  case Target::MLIR_CUDA:
273 #ifdef HAS_CUDA_MODEL
274  {
275  cudaError_t error;
276  error = cudaFree(ptr);
277  if (error != cudaSuccess) {
278  throw std::runtime_error(cudaGetErrorString(error));
279  }
280  }
281 #else
282  throw std::invalid_argument("target MLIR_CUDA is unavailable");
283 #endif
284  break;
285  default:
286  throw std::invalid_argument("unknown allocation target");
287  }
288  }
289 
290  private:
291  Target _target;
292  bool _always_managed;
293 };
294 
303 template<typename T>
304 T* allocate_on_target(Target target, std::size_t n, bool always_managed = false, bool do_zero = true) {
305  TargetAllocator<T> alloc(target, always_managed);
306  return alloc.allocate(n, do_zero);
307 }
317 template<typename T>
318 void deallocate_on_target(Target target, T* ptr) {
319  TargetAllocator<T> alloc(target);
320  return alloc.deallocate(ptr);
321 }
322 
323 } // namespace limpet
324 
325 #endif // TARGETS_H
std::string get_string_from_target(Target const target)
Get a string representation of a given target.
Definition: target.cc:46
TargetAllocator(Target target, bool always_managed=false)
Construct a TargetAllocator.
Definition: target.h:114
vectorized CPU code generated with MLIR
Definition: target.h:49
Allocator structure for dynamically allocating memory on multiple targets.
Definition: target.h:104
bool is_gpu(Target const target)
Checks if this is a GPU target.
Definition: target.cc:64
special value to handle unknown targets
Definition: target.h:47
T value_type
type to allocate
Definition: target.h:105
std::string get_target_list_string()
Returns a string containing the list of available targets.
Definition: target.cc:55
a token to indicate the maximum number of targets
Definition: target.h:52
bool is_concrete(Target const target)
Checks if target is a real, concrete target.
Definition: target.cc:68
void set_target(Target new_target)
Set a new target for this allocator.
Definition: target.h:134
Target get_target() const
Get the target for this allocator.
Definition: target.h:125
baseline CPU model generated with the original opencarp code generator
Definition: target.h:48
CUDA code for NVIDIA GPUs generated with MLIR.
Definition: target.h:51
T * allocate(std::size_t n, bool do_zero=true)
Allocate memory for type T.
Definition: target.h:154
Target get_target_from_string(std::string const str)
Returns a value from the Target enum from a given string.
Definition: target.cc:36
void deallocate(T *ptr, std::size_t n=0)
Deallocate memory pointed by ptr.
Definition: target.h:250
Target
enum that represents different targets to run ionic models on.
Definition: target.h:45
T * allocate_on_target(Target target, std::size_t n, bool always_managed=false, bool do_zero=true)
Utility function for allocating memory on a target. See TargetAllocator.
Definition: target.h:304
void deallocate_on_target(Target target, T *ptr)
Utility function for deallocating memory on a target. See TargetAllocator.
Definition: target.h:318
ROCM code for AMD GPUs generated with MLIR.
Definition: target.h:50