/**
 * Runs one timed single-precision complex GERU call through clBLAS.
 *
 * The timer identified by timer_id is started, clblasCgeru is enqueued on
 * queue_ with the operands held in buffer, the resulting event_ is waited
 * on, and the timer is then stopped, so the measured interval spans both
 * the enqueue and the wait.
 */
void xGeru<cl_float2>::call_func()
{
    timer.Start(timer_id);

    // One command queue, no wait list; event_ receives the event for this call.
    clblasCgeru(buffer.order,
                buffer.M, buffer.N,
                buffer.alpha,
                buffer.X, buffer.offx, buffer.incx,
                buffer.Y, buffer.offy, buffer.incy,
                buffer.A, buffer.offa, buffer.lda,
                1, &queue_,
                0, NULL,
                &event_);

    // Wait on the event before stopping the timer.
    clWaitForEvents(1, &event_);

    timer.Stop(timer_id);
}
/** Perform rank-1 update (unconjugated), \f$ A = \alpha x y^H + A \f$. @param[in] m Number of rows of A. m >= 0. @param[in] n Number of columns of A. n >= 0. @param[in] alpha Scalar \f$ \alpha \f$ @param[in] dx COMPLEX array on GPU device. The m element vector x of dimension (1 + (m-1)*incx). @param[in] incx Stride between consecutive elements of dx. incx != 0. @param[in] dy COMPLEX array on GPU device. The n element vector y of dimension (1 + (n-1)*incy). @param[in] incy Stride between consecutive elements of dy. incy != 0. @param[in,out] dA COMPLEX array of dimension (ldda,n), ldda >= max(1,m). The m-by-n matrix A, on GPU device. @param[in] ldda Leading dimension of dA. @ingroup magma_cblas2 */ extern "C" void magma_cgeru( magma_int_t m, magma_int_t n, magmaFloatComplex alpha, magmaFloatComplex_const_ptr dx, size_t dx_offset, magma_int_t incx, magmaFloatComplex_const_ptr dy, size_t dy_offset, magma_int_t incy, magmaFloatComplex_ptr dA, size_t dA_offset, magma_int_t ldda, magma_queue_t queue ) { cl_int err = clblasCgeru( clblasColumnMajor, m, n, alpha, dx, dx_offset, incx, dy, dy_offset, incy, dA, dA_offset, ldda, 1, &queue, 0, NULL, g_event ); check_error( err ); }