/**
 * Prototype of dmlsa_cuda, the double-precision counterpart of smlsa_cuda
 * (the two prototypes are identical except for double vs. float pointers).
 *
 * NOTE(review): only the declaration is visible here. The parameter roles
 * below are read off the types; anything about their meaning is an
 * assumption inferred from names and must be confirmed against the
 * implementation.
 *
 * @param m      integer size parameter (presumably a dimension of A - confirm)
 * @param n      integer size parameter (presumably a dimension of A - confirm)
 * @param k      integer size parameter (presumably the inner dimension shared
 *               by W and H - confirm)
 * @param A      pointer to const double data; not modified through this pointer
 * @param W      pointer to mutable double data (presumably an in/out buffer)
 * @param H      pointer to mutable double data (presumably an in/out buffer)
 * @param uType  integer selector (presumably chooses an update variant - confirm)
 * @param nIter  integer count (presumably the number of iterations - confirm)
 * @return int; NOTE(review): presumably a status code - confirm.
 *
 * TODO confirm whether A, W and H are expected to be host or device pointers.
 */
43 int dmlsa_cuda(
const int m,
const int n,
const int k,
const double *A,
double *W,
double *H,
const int uType,
const int nIter);
/**
 * Prototype of smlsa_cuda, the single-precision counterpart of dmlsa_cuda
 * (the two prototypes are identical except for float vs. double pointers).
 *
 * NOTE(review): only the declaration is visible here. The parameter roles
 * below are read off the types; anything about their meaning is an
 * assumption inferred from names and must be confirmed against the
 * implementation.
 *
 * @param m      integer size parameter (presumably a dimension of A - confirm)
 * @param n      integer size parameter (presumably a dimension of A - confirm)
 * @param k      integer size parameter (presumably the inner dimension shared
 *               by W and H - confirm)
 * @param A      pointer to const float data; not modified through this pointer
 * @param W      pointer to mutable float data (presumably an in/out buffer)
 * @param H      pointer to mutable float data (presumably an in/out buffer)
 * @param uType  integer selector (presumably chooses an update variant - confirm)
 * @param nIter  integer count (presumably the number of iterations - confirm)
 * @return int; NOTE(review): presumably a status code - confirm.
 *
 * TODO confirm whether A, W and H are expected to be host or device pointers.
 */
44 int smlsa_cuda(
const int m,
const int n,
const int k,
const float *A,
float *W,
float *H,
const int uType,
const int nIter);
/**
 * Prototype of ddotdiv_cuda, the double-precision counterpart of
 * sdotdiv_cuda. It is a host-callable function (no __global__ qualifier)
 * that takes a CUDA stream handle.
 *
 * NOTE(review): the name suggests an element-wise division of x by y written
 * to z, presumably by launching the vddotdiv_cuda kernel on `stream`; the
 * implementation is not visible here, so confirm before relying on this.
 *
 * @param n       integer count (presumably the number of elements - confirm)
 * @param x       pointer to const double data; not modified through this pointer
 * @param y       pointer to const double data; not modified through this pointer
 * @param z       pointer to mutable double data (presumably the output buffer)
 * @param stream  CUDA stream handle (presumably the stream the work is
 *                enqueued on - confirm, including whether the call returns
 *                before the work completes)
 */
48 void ddotdiv_cuda(
const int n,
const double *x,
const double *y,
double *z, cudaStream_t stream);
/**
 * Prototype of sdotdiv_cuda, the single-precision counterpart of
 * ddotdiv_cuda. It is a host-callable function (no __global__ qualifier)
 * that takes a CUDA stream handle.
 *
 * NOTE(review): the name suggests an element-wise division of x by y written
 * to z, presumably by launching the vsdotdiv_cuda kernel on `stream`; the
 * implementation is not visible here, so confirm before relying on this.
 *
 * @param n       integer count (presumably the number of elements - confirm)
 * @param x       pointer to const float data; not modified through this pointer
 * @param y       pointer to const float data; not modified through this pointer
 * @param z       pointer to mutable float data (presumably the output buffer)
 * @param stream  CUDA stream handle (presumably the stream the work is
 *                enqueued on - confirm, including whether the call returns
 *                before the work completes)
 */
49 void sdotdiv_cuda(
const int n,
const float *x,
const float *y,
float *z, cudaStream_t stream);
/**
 * Prototype of the vddotdiv_cuda CUDA kernel (declared __global__), the
 * double-precision counterpart of vsdotdiv_cuda.
 *
 * x and y are declared const and __restrict__, so the kernel promises not to
 * write through them and that they are not aliased by the other pointers it
 * accesses. z carries no __restrict__ qualifier.
 *
 * NOTE(review): the name suggests an element-wise division of x by y stored
 * in z; the kernel body and its expected grid/block layout are not visible
 * here - confirm against the implementation.
 *
 * @param n  integer count (presumably the number of elements - confirm)
 * @param x  read-only double input pointer
 * @param y  read-only double input pointer
 * @param z  mutable double pointer (presumably the output buffer)
 */
52 __global__
void vddotdiv_cuda(
const int n,
const double* __restrict__ x,
const double* __restrict__ y,
double *z);
/**
 * Prototype of the vsdotdiv_cuda CUDA kernel (declared __global__), the
 * single-precision counterpart of vddotdiv_cuda.
 *
 * x and y are declared const and __restrict__, so the kernel promises not to
 * write through them and that they are not aliased by the other pointers it
 * accesses. z carries no __restrict__ qualifier.
 *
 * NOTE(review): the name suggests an element-wise division of x by y stored
 * in z; the kernel body and its expected grid/block layout are not visible
 * here - confirm against the implementation.
 *
 * @param n  integer count (presumably the number of elements - confirm)
 * @param x  read-only float input pointer
 * @param y  read-only float input pointer
 * @param z  mutable float pointer (presumably the output buffer)
 */
53 __global__
void vsdotdiv_cuda(
const int n,
const float* __restrict__ x,
const float* __restrict__ y,
float *z);
int smlsa_cuda(const int m, const int n, const int k, const float *A, float *W, float *H, const int uType, const int nIter)
Header file for using the utility modules from CUDA source code.
__global__ void vddotdiv_cuda(const int n, const double *__restrict__ x, const double *__restrict__ y, double *z)
int dmlsa_cuda(const int m, const int n, const int k, const double *A, double *W, double *H, const int uType, const int nIter)
void sdotdiv_cuda(const int n, const float *x, const float *y, float *z, cudaStream_t stream)
void ddotdiv_cuda(const int n, const double *x, const double *y, double *z, cudaStream_t stream)
__global__ void vsdotdiv_cuda(const int n, const float *__restrict__ x, const float *__restrict__ y, float *z)