PLSSVM/backends_2CUDA_2csvm_8hpp_source.html

 #ifndef PLSSVM_BACKENDS_CUDA_CSVM_HPP_

 #define PLSSVM_BACKENDS_CUDA_CSVM_HPP_

 #pragma once


 #include "plssvm/backends/CUDA/detail/device_ptr.cuh"  // plssvm::cuda::detail::device_ptr

 #include "plssvm/backends/gpu_csvm.hpp"                // plssvm::detail::gpu_csvm

 #include "plssvm/parameter.hpp"                        // plssvm::parameter, plssvm::detail::parameter

 #include "plssvm/target_platforms.hpp"                 // plssvm::target_platform


 #include <cstddef>                                     // std::size_t

 #include <type_traits>                                 // std::true_type

 #include <utility>                                     // std::forward


 namespace plssvm {


 namespace detail {


 // Forward declaration of the backend independent execution range class.
 // This header only names the type as `const execution_range &` in the kernel
 // launch signatures of cuda::csvm, so a declaration is enough here.

 class execution_range;


 }  // namespace detail


 namespace cuda {


 /**
  * @brief A C-SVM implementation using CUDA as backend.
  * @details Derives from the shared GPU base class `::plssvm::detail::gpu_csvm`, instantiated with the CUDA
  *          `detail::device_ptr` wrapper as device pointer type and `int` as device queue type.
  *          Each `run_*_kernel` override exists once for `float` and once for `double`; both overloads only
  *          forward their arguments to the matching `run_*_kernel_impl` member template.
  */
 class csvm : public ::plssvm::detail::gpu_csvm<detail::device_ptr, int> {
   protected:
     /// The GPU base class type. Protected (instead of private) for the test mock class.
     using base_type = ::plssvm::detail::gpu_csvm<detail::device_ptr, int>;

     /// The available/used backend devices, inherited from the base class.
     using base_type::devices_;

   public:
     /// The type of the device pointer (dependent on the used backend).
     using base_type::device_ptr_type;
     /// The type of the device queue (dependent on the used backend).
     using typename base_type::queue_type;

     /**
      * @brief Construct a new C-SVM using the CUDA backend with the parameters given through @p params.
      * @param[in] params the C-SVM parameters (value-initialized if omitted)
      */
     explicit csvm(parameter params = {});

     /**
      * @brief Construct a new C-SVM using the CUDA backend on the @p target platform with the parameters
      *        given through @p params.
      * @param[in] target the target platform
      * @param[in] params the C-SVM parameters (value-initialized if omitted)
      */
     explicit csvm(target_platform target, parameter params = {});

     /**
      * @brief Construct a new C-SVM using the CUDA backend and the optionally provided @p named_args.
      * @details Delegates to the constructor taking a target platform, passing `target_platform::automatic`.
      *          Only enabled if `has_only_parameter_named_args_v<Args...>` holds.
      * @param[in] named_args the named arguments, perfectly forwarded
      */
     template <typename... Args, PLSSVM_REQUIRES(::plssvm::detail::has_only_parameter_named_args_v<Args...>)>
     explicit csvm(Args &&...named_args) :
         csvm{ plssvm::target_platform::automatic, std::forward<Args>(named_args)... } {}

     /**
      * @brief Construct a new C-SVM using the CUDA backend on the @p target platform and the optionally
      *        provided @p named_args.
      * @details Forwards the named arguments to the base class and afterwards runs `init(target)`.
      *          Only enabled if `has_only_parameter_named_args_v<Args...>` holds.
      * @param[in] target the target platform
      * @param[in] named_args the named arguments, perfectly forwarded to the base class
      */
     template <typename... Args, PLSSVM_REQUIRES(::plssvm::detail::has_only_parameter_named_args_v<Args...>)>
     explicit csvm(const target_platform target, Args &&...named_args) :
         base_type{ std::forward<Args>(named_args)... } {
         init(target);
     }

     /// Delete copy-constructor since a CSVM is a move-only type.
     csvm(const csvm &) = delete;
     /// Default move-constructor since a virtual destructor has been declared.
     csvm(csvm &&) noexcept = default;
     /// Delete copy-assignment operator since a CSVM is a move-only type.
     csvm &operator=(const csvm &) = delete;
     /// Default move-assignment operator since a virtual destructor has been declared.
     csvm &operator=(csvm &&) noexcept = default;
     /// Overrides the virtual destructor of the base class; not defined inline.
     ~csvm() override;

   protected:
     /**
      * @brief Synchronize the device denoted by @p queue.
      * @param[in] queue the device queue to synchronize
      */
     void device_synchronize(const queue_type &queue) const final;

     /// Run the device kernel filling the `q` vector (`float` overload, forwards to run_q_kernel_impl()).
     void run_q_kernel(std::size_t device,
                       const ::plssvm::detail::execution_range &range,
                       const ::plssvm::detail::parameter<float> &params,
                       device_ptr_type<float> &q_d,
                       const device_ptr_type<float> &data_d,
                       const device_ptr_type<float> &data_last_d,
                       std::size_t num_data_points_padded,
                       std::size_t num_features) const final {
         run_q_kernel_impl(device, range, params, q_d, data_d, data_last_d, num_data_points_padded, num_features);
     }

     /// Run the device kernel filling the `q` vector (`double` overload, forwards to run_q_kernel_impl()).
     void run_q_kernel(std::size_t device,
                       const ::plssvm::detail::execution_range &range,
                       const ::plssvm::detail::parameter<double> &params,
                       device_ptr_type<double> &q_d,
                       const device_ptr_type<double> &data_d,
                       const device_ptr_type<double> &data_last_d,
                       std::size_t num_data_points_padded,
                       std::size_t num_features) const final {
         run_q_kernel_impl(device, range, params, q_d, data_d, data_last_d, num_data_points_padded, num_features);
     }

     /**
      * @brief Run the device kernel filling the `q` vector.
      * @tparam real_type the floating point type (the overrides above use `float` and `double`)
      */
     template <typename real_type>
     void run_q_kernel_impl(std::size_t device,
                            const ::plssvm::detail::execution_range &range,
                            const ::plssvm::detail::parameter<real_type> &params,
                            device_ptr_type<real_type> &q_d,
                            const device_ptr_type<real_type> &data_d,
                            const device_ptr_type<real_type> &data_last_d,
                            std::size_t num_data_points_padded,
                            std::size_t num_features) const;

     /// Run the main device kernel used in the CG algorithm (`float` overload, forwards to run_svm_kernel_impl()).
     void run_svm_kernel(std::size_t device,
                         const ::plssvm::detail::execution_range &range,
                         const ::plssvm::detail::parameter<float> &params,
                         const device_ptr_type<float> &q_d,
                         device_ptr_type<float> &r_d,
                         const device_ptr_type<float> &x_d,
                         const device_ptr_type<float> &data_d,
                         float QA_cost,
                         float add,
                         std::size_t num_data_points_padded,
                         std::size_t num_features) const final {
         run_svm_kernel_impl(device, range, params, q_d, r_d, x_d, data_d, QA_cost, add, num_data_points_padded, num_features);
     }

     /// Run the main device kernel used in the CG algorithm (`double` overload, forwards to run_svm_kernel_impl()).
     void run_svm_kernel(std::size_t device,
                         const ::plssvm::detail::execution_range &range,
                         const ::plssvm::detail::parameter<double> &params,
                         const device_ptr_type<double> &q_d,
                         device_ptr_type<double> &r_d,
                         const device_ptr_type<double> &x_d,
                         const device_ptr_type<double> &data_d,
                         double QA_cost,
                         double add,
                         std::size_t num_data_points_padded,
                         std::size_t num_features) const final {
         run_svm_kernel_impl(device, range, params, q_d, r_d, x_d, data_d, QA_cost, add, num_data_points_padded, num_features);
     }

     /**
      * @brief Run the main device kernel used in the CG algorithm.
      * @tparam real_type the floating point type (the overrides above use `float` and `double`)
      */
     template <typename real_type>
     void run_svm_kernel_impl(std::size_t device,
                              const ::plssvm::detail::execution_range &range,
                              const ::plssvm::detail::parameter<real_type> &params,
                              const device_ptr_type<real_type> &q_d,
                              device_ptr_type<real_type> &r_d,
                              const device_ptr_type<real_type> &x_d,
                              const device_ptr_type<real_type> &data_d,
                              real_type QA_cost,
                              real_type add,
                              std::size_t num_data_points_padded,
                              std::size_t num_features) const;

     /// Run the device kernel to calculate the `w` vector used to speed up the prediction (`float` overload, forwards to run_w_kernel_impl()).
     void run_w_kernel(std::size_t device,
                       const ::plssvm::detail::execution_range &range,
                       device_ptr_type<float> &w_d,
                       const device_ptr_type<float> &alpha_d,
                       const device_ptr_type<float> &data_d,
                       const device_ptr_type<float> &data_last_d,
                       std::size_t num_data_points,
                       std::size_t num_features) const final {
         run_w_kernel_impl(device, range, w_d, alpha_d, data_d, data_last_d, num_data_points, num_features);
     }

     /// Run the device kernel to calculate the `w` vector used to speed up the prediction (`double` overload, forwards to run_w_kernel_impl()).
     void run_w_kernel(std::size_t device,
                       const ::plssvm::detail::execution_range &range,
                       device_ptr_type<double> &w_d,
                       const device_ptr_type<double> &alpha_d,
                       const device_ptr_type<double> &data_d,
                       const device_ptr_type<double> &data_last_d,
                       std::size_t num_data_points,
                       std::size_t num_features) const final {
         run_w_kernel_impl(device, range, w_d, alpha_d, data_d, data_last_d, num_data_points, num_features);
     }

     /**
      * @brief Run the device kernel to calculate the `w` vector used to speed up the prediction.
      * @tparam real_type the floating point type (the overrides above use `float` and `double`)
      */
     template <typename real_type>
     void run_w_kernel_impl(std::size_t device,
                            const ::plssvm::detail::execution_range &range,
                            device_ptr_type<real_type> &w_d,
                            const device_ptr_type<real_type> &alpha_d,
                            const device_ptr_type<real_type> &data_d,
                            const device_ptr_type<real_type> &data_last_d,
                            std::size_t num_data_points,
                            std::size_t num_features) const;

     /// Run the device kernel (only on the first device) to predict the new data points @p point_d (`float` overload, forwards to run_predict_kernel_impl()).
     void run_predict_kernel(const ::plssvm::detail::execution_range &range,
                             const ::plssvm::detail::parameter<float> &params,
                             device_ptr_type<float> &out_d,
                             const device_ptr_type<float> &alpha_d,
                             const device_ptr_type<float> &point_d,
                             const device_ptr_type<float> &data_d,
                             const device_ptr_type<float> &data_last_d,
                             std::size_t num_support_vectors,
                             std::size_t num_predict_points,
                             std::size_t num_features) const final {
         run_predict_kernel_impl(range, params, out_d, alpha_d, point_d, data_d, data_last_d, num_support_vectors, num_predict_points, num_features);
     }

     /// Run the device kernel (only on the first device) to predict the new data points @p point_d (`double` overload, forwards to run_predict_kernel_impl()).
     void run_predict_kernel(const ::plssvm::detail::execution_range &range,
                             const ::plssvm::detail::parameter<double> &params,
                             device_ptr_type<double> &out_d,
                             const device_ptr_type<double> &alpha_d,
                             const device_ptr_type<double> &point_d,
                             const device_ptr_type<double> &data_d,
                             const device_ptr_type<double> &data_last_d,
                             std::size_t num_support_vectors,
                             std::size_t num_predict_points,
                             std::size_t num_features) const final {
         run_predict_kernel_impl(range, params, out_d, alpha_d, point_d, data_d, data_last_d, num_support_vectors, num_predict_points, num_features);
     }

     /**
      * @brief Run the device kernel (only on the first device) to predict the new data points @p point_d.
      * @tparam real_type the floating point type (the overrides above use `float` and `double`)
      */
     template <typename real_type>
     void run_predict_kernel_impl(const ::plssvm::detail::execution_range &range,
                                  const ::plssvm::detail::parameter<real_type> &params,
                                  device_ptr_type<real_type> &out_d,
                                  const device_ptr_type<real_type> &alpha_d,
                                  const device_ptr_type<real_type> &point_d,
                                  const device_ptr_type<real_type> &data_d,
                                  const device_ptr_type<real_type> &data_last_d,
                                  std::size_t num_support_vectors,
                                  std::size_t num_predict_points,
                                  std::size_t num_features) const;

   private:
     /**
      * @brief Initialize all important states related to the CUDA backend.
      * @param[in] target the target platform
      */
     void init(target_platform target);
 };


 }  // namespace cuda


 namespace detail {


 // Explicit specialization of csvm_backend_exists for the CUDA C-SVM.
 // Deriving from std::true_type sets its `value` member to true, i.e. it marks
 // cuda::csvm as a C-SVM using an available backend.
 template <>

 struct csvm_backend_exists<cuda::csvm> : std::true_type {};


 }  // namespace detail


 }  // namespace plssvm


 #endif  // PLSSVM_BACKENDS_CUDA_CSVM_HPP_

plssvm::csvm
Base class for all C-SVM backends.
Definition: csvm.hpp:50

plssvm::cuda::csvm
A C-SVM implementation using CUDA as backend.
Definition: csvm.hpp:39

plssvm::cuda::csvm::device_synchronize
void device_synchronize(const queue_type &queue) const final
Synchronize the device denoted by queue.

plssvm::cuda::csvm::run_predict_kernel
void run_predict_kernel(const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< double > &params, device_ptr_type< double > &out_d, const device_ptr_type< double > &alpha_d, const device_ptr_type< double > &point_d, const device_ptr_type< double > &data_d, const device_ptr_type< double > &data_last_d, std::size_t num_support_vectors, std::size_t num_predict_points, std::size_t num_features) const final
Run the device kernel (only on the first device) to predict the new data points point_d.
Definition: csvm.hpp:171

plssvm::cuda::csvm::run_q_kernel
void run_q_kernel(std::size_t device, const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< double > &params, device_ptr_type< double > &q_d, const device_ptr_type< double > &data_d, const device_ptr_type< double > &data_last_d, std::size_t num_data_points_padded, std::size_t num_features) const final
Run the device kernel filling the q vector.
Definition: csvm.hpp:132

plssvm::cuda::csvm::csvm
csvm(target_platform target, parameter params={})
Construct a new C-SVM using the CUDA backend on the target platform with the parameters given through...

plssvm::cuda::csvm::csvm
csvm(csvm &&) noexcept=default
Default move-constructor since a virtual destructor has been declared. noexcept

plssvm::cuda::csvm::run_q_kernel_impl
void run_q_kernel_impl(std::size_t device, const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< real_type > &params, device_ptr_type< real_type > &q_d, const device_ptr_type< real_type > &data_d, const device_ptr_type< real_type > &data_last_d, std::size_t num_data_points_padded, std::size_t num_features) const
Run the device kernel filling the q vector.

plssvm::cuda::csvm::csvm
csvm(const csvm &)=delete
Delete copy-constructor since a CSVM is a move-only type.

plssvm::cuda::csvm::init
void init(target_platform target)
Initialize all important states related to the CUDA backend.

plssvm::cuda::csvm::run_w_kernel_impl
void run_w_kernel_impl(std::size_t device, const ::plssvm::detail::execution_range &range, device_ptr_type< real_type > &w_d, const device_ptr_type< real_type > &alpha_d, const device_ptr_type< real_type > &data_d, const device_ptr_type< real_type > &data_last_d, std::size_t num_data_points, std::size_t num_features) const
Run the device kernel to calculate the w vector used to speed up the prediction when using the linea...

plssvm::cuda::csvm::run_svm_kernel_impl
void run_svm_kernel_impl(std::size_t device, const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< real_type > &params, const device_ptr_type< real_type > &q_d, device_ptr_type< real_type > &r_d, const device_ptr_type< real_type > &x_d, const device_ptr_type< real_type > &data_d, real_type QA_cost, real_type add, std::size_t num_data_points_padded, std::size_t num_features) const
Run the main device kernel used in the CG algorithm.

plssvm::cuda::csvm::run_predict_kernel_impl
void run_predict_kernel_impl(const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< real_type > &params, device_ptr_type< real_type > &out_d, const device_ptr_type< real_type > &alpha_d, const device_ptr_type< real_type > &point_d, const device_ptr_type< real_type > &data_d, const device_ptr_type< real_type > &data_last_d, std::size_t num_support_vectors, std::size_t num_predict_points, std::size_t num_features) const
Run the device kernel (only on the first device) to predict the new data points point_d.

plssvm::cuda::csvm::csvm
csvm(Args &&...named_args)
Construct a new C-SVM using the CUDA backend and the optionally provided named_args.
Definition: csvm.hpp:80

plssvm::cuda::csvm::run_w_kernel
void run_w_kernel(std::size_t device, const ::plssvm::detail::execution_range &range, device_ptr_type< double > &w_d, const device_ptr_type< double > &alpha_d, const device_ptr_type< double > &data_d, const device_ptr_type< double > &data_last_d, std::size_t num_data_points, std::size_t num_features) const final
Run the device kernel to calculate the w vector used to speed up the prediction when using the linea...
Definition: csvm.hpp:158

plssvm::cuda::csvm::run_svm_kernel
void run_svm_kernel(std::size_t device, const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< float > &params, const device_ptr_type< float > &q_d, device_ptr_type< float > &r_d, const device_ptr_type< float > &x_d, const device_ptr_type< float > &data_d, float QA_cost, float add, std::size_t num_data_points_padded, std::size_t num_features) const final
Run the main device kernel used in the CG algorithm.
Definition: csvm.hpp:141

plssvm::cuda::csvm::run_predict_kernel
void run_predict_kernel(const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< float > &params, device_ptr_type< float > &out_d, const device_ptr_type< float > &alpha_d, const device_ptr_type< float > &point_d, const device_ptr_type< float > &data_d, const device_ptr_type< float > &data_last_d, std::size_t num_support_vectors, std::size_t num_predict_points, std::size_t num_features) const final
Run the device kernel (only on the first device) to predict the new data points point_d.
Definition: csvm.hpp:167

plssvm::cuda::csvm::run_w_kernel
void run_w_kernel(std::size_t device, const ::plssvm::detail::execution_range &range, device_ptr_type< float > &w_d, const device_ptr_type< float > &alpha_d, const device_ptr_type< float > &data_d, const device_ptr_type< float > &data_last_d, std::size_t num_data_points, std::size_t num_features) const final
Run the device kernel to calculate the w vector used to speed up the prediction when using the linea...
Definition: csvm.hpp:154

plssvm::cuda::csvm::csvm
csvm(parameter params={})
Construct a new C-SVM using the CUDA backend with the parameters given through params.

plssvm::cuda::csvm::run_svm_kernel
void run_svm_kernel(std::size_t device, const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< double > &params, const device_ptr_type< double > &q_d, device_ptr_type< double > &r_d, const device_ptr_type< double > &x_d, const device_ptr_type< double > &data_d, double QA_cost, double add, std::size_t num_data_points_padded, std::size_t num_features) const final
Run the main device kernel used in the CG algorithm.
Definition: csvm.hpp:145

plssvm::cuda::csvm::run_q_kernel
void run_q_kernel(std::size_t device, const ::plssvm::detail::execution_range &range, const ::plssvm::detail::parameter< float > &params, device_ptr_type< float > &q_d, const device_ptr_type< float > &data_d, const device_ptr_type< float > &data_last_d, std::size_t num_data_points_padded, std::size_t num_features) const final
Run the device kernel filling the q vector.
Definition: csvm.hpp:128

plssvm::cuda::csvm::csvm
csvm(const target_platform target, Args &&...named_args)
Construct a new C-SVM using the CUDA backend on the target platform and the optionally provided named...
Definition: csvm.hpp:92

plssvm::detail::execution_range
Class specifying a backend independent execution range.
Definition: execution_range.hpp:31

plssvm::detail::gpu_csvm
A C-SVM implementation for all GPU backends to reduce code duplication.
Definition: gpu_csvm.hpp:46

plssvm::detail::gpu_csvm< detail::device_ptr, int >::devices_
std::vector< queue_type > devices_
The available/used backend devices.
Definition: gpu_csvm.hpp:280

plssvm::detail::gpu_csvm< detail::device_ptr, int >::queue_type
int queue_type
The type of the device queue (dependent on the used backend).
Definition: gpu_csvm.hpp:52

plssvm::detail::gpu_csvm< detail::device_ptr, int >::device_ptr_type
detail::device_ptr< real_type > device_ptr_type
The type of the device pointer (dependent on the used backend).
Definition: gpu_csvm.hpp:50

device_ptr.cuh
Small wrapper around a CUDA device pointer.

gpu_csvm.hpp
Defines the base class for all C-SVM backends using a GPU. Used for code duplication reduction.

plssvm
The main namespace containing all public API functions.
Definition: backend_types.hpp:24

plssvm::target_platform
target_platform
Enum class for all possible targets.
Definition: target_platforms.hpp:25

plssvm::backend_type::automatic
@ automatic

plssvm::backend_type::cuda
@ cuda

parameter.hpp
Implements the parameter class encapsulating all important C-SVM parameters.

plssvm::csvm_backend_exists
Sets the value of the value member to true if T is a C-SVM using an available backend....
Definition: csvm.hpp:410

plssvm::detail::parameter< double >

target_platforms.hpp
Defines an enumeration holding all possible target platforms. Can also include targets not available ...

PLSSVM_REQUIRES
#define PLSSVM_REQUIRES(...)
A shorthand macro for the std::enable_if_t type trait.
Definition: type_traits.hpp:33