en/latest/bld__mult__cuda__kernels_8hpp_source.html

 #pragma once
 #include "bld_mult_cuda_funcs.hpp"

 /**
  * Main namespace for bnmf-algs library.
  *
  * This header only declares the CUDA device/kernel templates used by the
  * bld_mult algorithm; no definitions are visible here.
  */
 namespace bnmf_algs {
 namespace details {
 namespace bld_mult {
 namespace kernel {
 /**
  * Device function to return psi_appr of a real number.
  *
  * NOTE(review): presumably an approximation of the psi (digamma) function,
  * judging by the name only -- confirm against the definition.
  *
  * @tparam Real Scalar type of the argument and the result.
  * @param x Input value.
  * @return psi_appr evaluated at x.
  */
 template <typename Real> __device__ Real psi_appr(Real x);

 /**
  * Perform grad_plus update employed in bld_mult algorithm using
  * tensors/matrices residing on a GPU device.
  *
  * @tparam Real Scalar type of the matrix/tensor entries.
  * @param S Pitched pointer to the S tensor.
  * @param beta_eph Pointer to the beta_eph data.
  * @param pitch Pitch value. NOTE(review): presumably the pitch (in bytes) of
  * beta_eph as returned by a pitched allocation -- TODO confirm.
  * @param grad_plus Pitched pointer to the grad_plus tensor (presumably the
  * output of this kernel -- confirm against the definition).
  * @param width,height,depth Extents handed to the kernel. NOTE(review):
  * presumably the dimensions of S; which tensor axis each one maps to is not
  * visible from this declaration -- TODO confirm.
  */
 template <typename Real>
 __global__ void update_grad_plus(cudaPitchedPtr S, const Real* beta_eph,
                                  size_t pitch, cudaPitchedPtr grad_plus,
                                  size_t width, size_t height, size_t depth);

 /**
  * Perform nom_mult update employed in bld_mult algorithm using
  * tensors/matrices residing on a GPU device.
  *
  * @tparam Real Scalar type of the matrix/tensor entries.
  * @param S Pitched pointer to the S tensor.
  * @param X_reciprocal Read-only pointer to the X_reciprocal matrix.
  * @param X_reciprocal_pitch Pitch of X_reciprocal (presumably in bytes --
  * TODO confirm).
  * @param grad_minus Read-only pointer to the grad_minus matrix.
  * @param grad_minus_pitch Pitch of grad_minus (presumably in bytes -- TODO
  * confirm).
  * @param nom_mult Non-const pointer to the nom_mult matrix (presumably the
  * output of this kernel -- confirm against the definition).
  * @param nom_mult_pitch Pitch of nom_mult (presumably in bytes -- TODO
  * confirm).
  * @param width,height,depth Extents handed to the kernel. NOTE(review):
  * presumably the dimensions of S -- TODO confirm axis mapping.
  */
 template <typename Real>
 __global__ void update_nom(cudaPitchedPtr S, const Real* X_reciprocal,
                            size_t X_reciprocal_pitch, const Real* grad_minus,
                            size_t grad_minus_pitch, Real* nom_mult,
                            size_t nom_mult_pitch, size_t width, size_t height,
                            size_t depth);

 /**
  * Perform denom_mult update employed in bld_mult algorithm using
  * tensors/matrices residing on a GPU device.
  *
  * @tparam Real Scalar type of the matrix/tensor entries.
  * @param S Pitched pointer to the S tensor.
  * @param X_reciprocal Read-only pointer to the X_reciprocal matrix.
  * @param X_reciprocal_pitch Pitch of X_reciprocal (presumably in bytes --
  * TODO confirm).
  * @param grad_plus Pitched pointer to the grad_plus tensor.
  * @param denom_mult Non-const pointer to the denom_mult matrix (presumably
  * the output of this kernel -- confirm against the definition).
  * @param denom_mult_pitch Pitch of denom_mult (presumably in bytes -- TODO
  * confirm).
  * @param width,height,depth Extents handed to the kernel. NOTE(review):
  * presumably the dimensions of S -- TODO confirm axis mapping.
  */
 template <typename Real>
 __global__ void update_denom(cudaPitchedPtr S, const Real* X_reciprocal,
                              size_t X_reciprocal_pitch,
                              cudaPitchedPtr grad_plus, Real* denom_mult,
                              size_t denom_mult_pitch, size_t width,
                              size_t height, size_t depth);

 /**
  * Perform S update employed in bld_mult algorithm using tensors/matrices
  * residing on a GPU device.
  *
  * All plain-pointer arguments are read-only (const); S and grad_plus are
  * passed as pitched pointers. NOTE(review): S is presumably the tensor
  * updated by this kernel -- confirm against the definition.
  *
  * @tparam Real Scalar type of the matrix/tensor entries.
  * @param X Read-only pointer to the X matrix.
  * @param X_pitch Pitch of X (presumably in bytes -- TODO confirm).
  * @param nom_mult Read-only pointer to the nom_mult matrix.
  * @param nom_mult_pitch Pitch of nom_mult (presumably in bytes -- TODO
  * confirm).
  * @param denom_mult Read-only pointer to the denom_mult matrix.
  * @param denom_mult_pitch Pitch of denom_mult (presumably in bytes -- TODO
  * confirm).
  * @param grad_minus Read-only pointer to the grad_minus matrix.
  * @param grad_minus_pitch Pitch of grad_minus (presumably in bytes -- TODO
  * confirm).
  * @param grad_plus Pitched pointer to the grad_plus tensor.
  * @param S_ijp Read-only pointer to the S_ijp matrix.
  * @param S_ijp_pitch Pitch of S_ijp (presumably in bytes -- TODO confirm).
  * @param S Pitched pointer to the S tensor.
  * @param width,height,depth Extents handed to the kernel. NOTE(review):
  * presumably the dimensions of S -- TODO confirm axis mapping.
  */
 template <typename Real>
 __global__ void
 update_S(const Real* X, size_t X_pitch, const Real* nom_mult,
          size_t nom_mult_pitch, const Real* denom_mult, size_t denom_mult_pitch,
          const Real* grad_minus, size_t grad_minus_pitch,
          cudaPitchedPtr grad_plus, const Real* S_ijp, size_t S_ijp_pitch,
          cudaPitchedPtr S, size_t width, size_t height, size_t depth);
 } // namespace kernel
 } // namespace bld_mult
 } // namespace details
 } // namespace bnmf_algs
bnmf_algs::details::bld_mult::kernel::update_denom
__global__ void update_denom(cudaPitchedPtr S, const Real *X_reciprocal, size_t X_reciprocal_pitch, cudaPitchedPtr grad_plus, Real *denom_mult, size_t denom_mult_pitch, size_t width, size_t height, size_t depth)
Perform denom_mult update employed in bld_mult algorithm using tensors/matrices residing on a GPU device...

bnmf_algs::details::bld_mult::X_reciprocal
matrix_t< T > X_reciprocal(const matrix_t< T > &X, double eps)
Compute the reciprocal $\frac{1}{X}$ of the input matrix $X$.
Definition: bld_mult_funcs.hpp:87

bld_mult_cuda_funcs.hpp

bnmf_algs::details::bld_mult::kernel::update_grad_plus
__global__ void update_grad_plus(cudaPitchedPtr S, const Real *beta_eph, size_t pitch, cudaPitchedPtr grad_plus, size_t width, size_t height, size_t depth)
Perform grad_plus update employed in bld_mult algorithm using tensors/matrices residing on a GPU device...

bnmf_algs::bld::bld_mult
tensor_t< T, 3 > bld_mult(const matrix_t< T > &X, const size_t z, const alloc_model::Params< Scalar > &model_params, size_t max_iter=1000, bool use_psi_appr=false, double eps=1e-50)
Compute tensor $S$, the solution of the BLD problem, from matrix $X$ using multiplicative update rules...
Definition: bld_mult.hpp:83

bnmf_algs::details::bld_mult::kernel::update_nom
__global__ void update_nom(cudaPitchedPtr S, const Real *X_reciprocal, size_t X_reciprocal_pitch, const Real *grad_minus, size_t grad_minus_pitch, Real *nom_mult, size_t nom_mult_pitch, size_t width, size_t height, size_t depth)
Perform nom_mult update employed in bld_mult algorithm using tensors/matrices residing on a GPU device...

bnmf_algs::details::bld_mult::kernel::psi_appr
__device__ Real psi_appr(Real x)
Device function to return psi_appr of a real number.
Definition: util.hpp:440

bnmf_algs::details::bld_mult::kernel::update_S
__global__ void update_S(const Real *X, size_t X_pitch, const Real *nom_mult, size_t nom_mult_pitch, const Real *denom_mult, size_t denom_mult_pitch, const Real *grad_minus, size_t grad_minus_pitch, cudaPitchedPtr grad_plus, const Real *S_ijp, size_t S_ijp_pitch, cudaPitchedPtr S, size_t width, size_t height, size_t depth)
Perform S update employed in bld_mult algorithm using tensors/matrices residing on a GPU device...

bnmf_algs
Main namespace for bnmf-algs library.
Definition: alloc_model_funcs.hpp:12