本文整理汇总了C++中CLWrapper::getBuffer方法的典型用法代码示例。如果您正苦于以下问题:C++ CLWrapper::getBuffer方法的具体用法?C++ CLWrapper::getBuffer怎么用?C++ CLWrapper::getBuffer使用的例子?那么, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类CLWrapper
的用法示例。
在下文中一共展示了CLWrapper::getBuffer方法的5个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的C++代码示例。
示例1: THClBlas_dot
float THClBlas_dot(THClState *state, long n,
CLWrapper *xwrapper, long xoffset, long incx,
CLWrapper *ywrapper, long yoffset, long incy)
{
if(n == 1)
{
incx = 1;
incy = 1;
}
if( (n <= INT_MAX) && (incx <= INT_MAX) && (incy <= INT_MAX) )
{
int i_n = (int)n;
int i_incx = (int)incx;
int i_incy = (int)incy;
float result;
cl_int err;
err = clblasSetup();
if (err != CL_SUCCESS) {
THError("clblasSetup() failed with %d", err);
}
CLWrapper *resultWrapper = state->cl->wrap( 1, &result );
float *scratch = new float[i_n];
CLWrapper *scratchWrapper = state->cl->wrap(i_n, scratch);
scratchWrapper->createOnDevice();
resultWrapper->createOnDevice();
cl_event event = NULL;
err = clblasSdot( i_n, resultWrapper->getBuffer(), 0,
xwrapper->getBuffer(), xoffset, i_incx,
ywrapper->getBuffer(), yoffset, i_incy,
scratchWrapper->getBuffer(),
1, state->cl->queue, 0, NULL, &event);
// THCublasCheck(cublasSdot(*state->blasState->current_handle, i_n, x, i_incx, y, i_incy, &result));
// ClDeviceSynchronize();
if (err != CL_SUCCESS) {
THError("clblasSdot() failed with %d", err);
}
else {
/* Wait for calculations to be finished. */
err = clWaitForEvents(1, &event);
}
resultWrapper->copyToHost();
/* Finalize work with clblas. */
clblasTeardown();
delete resultWrapper;
delete scratchWrapper;
delete[] scratch;
return result;
}
THError("Cublas_dot only supports n, incx and incy "
"upto signed integer limits: %d", INT_MAX);
THError("Not implemented");
return -1;
}
示例2: THClBlas_gemm2
void THClBlas_gemm2(THClState *state, char orderchar, char transa, char transb, long m, long n, long k, float alpha,
THClTensor *a, long lda, THClTensor *b, long ldb, float beta,
THClTensor *c, long ldc)
{
StatefulTimer::timeCheck("THClBlas_gemm START");
CLWrapper *aWrapper = THClTensor_wrapper(state, a);
CLWrapper *bWrapper = THClTensor_wrapper(state, b);
CLWrapper *cWrapper = THClTensor_wrapper(state, c);
long offseta = THClTensor_storageOffset(state, a);
long offsetb = THClTensor_storageOffset(state, b);
long offsetc = THClTensor_storageOffset(state, c);
// adjustLd(transa, transb, m, n, k, &lda, &ldb, &ldc);
clblasTranspose opa = convertTransToClblasOperation(transa);
clblasTranspose opb = convertTransToClblasOperation(transb);
clblasOrder order = orderchar == 'c' ? clblasColumnMajor : clblasRowMajor;
if( (m <= INT_MAX) && (n <= INT_MAX) && (k <= INT_MAX) && (lda <= INT_MAX) && (ldb <= INT_MAX) && (ldc <= INT_MAX) )
{
int i_m = (int)m;
int i_n = (int)n;
int i_k = (int)k;
int i_lda = (int)lda;
int i_ldb = (int)ldb;
int i_ldc = (int)ldc;
cl_int err;
if( !aWrapper->isOnDevice() ) {
aWrapper->createOnDevice();
}
if( !bWrapper->isOnDevice() ) {
bWrapper->createOnDevice();
}
if( !cWrapper->isOnDevice() ) {
cWrapper->createOnDevice();
}
EasyCL *cl = cWrapper->getCl();
cl_event *event = 0;
if(state->addFinish) {
event = new cl_event();
}
err = clblasSgemm(order, opa, opb, i_m, i_n, i_k,
alpha, aWrapper->getBuffer(), offseta, i_lda,
bWrapper->getBuffer(), offsetb, i_ldb, beta,
cWrapper->getBuffer(), offsetc, i_ldc,
1, cl->queue, 0, NULL, event);
if (err != CL_SUCCESS) {
THError("clblasSgemm() failed with %d", err);
}
else {
if(state->addFinish) {
err = clWaitForEvents(1, event);
if (err != CL_SUCCESS) {
// throw runtime_error("clblasSger() failed with " + easycl::toString(err));
THError("clblasSger: wait for event failed with %d", err);
}
clReleaseEvent(*event);
delete event;
}
}
cWrapper->markDeviceDirty();
StatefulTimer::timeCheck("THClBlas_gemm END");
return;
}
THError("Clblas_gemm only supports m, n, k, lda, ldb, ldc"
"with the bound [val] <= %d", INT_MAX);
}
示例3: THClBlas_gemv
/* Level 2 */
void THClBlas_gemv(THClState *state, char trans, long m, long n, float alpha,
THClTensor *a, long lda,
THClTensor *x, long incx,
float beta,
THClTensor *y, long incy)
{
StatefulTimer::timeCheck("THClBlas_gemv START");
CLWrapper *awrapper = THClTensor_wrapper(state, a);
CLWrapper *xwrapper = THClTensor_wrapper(state, x);
CLWrapper *ywrapper = THClTensor_wrapper(state, y);
long aoffset = THClTensor_storageOffset(state, a);
long xoffset = THClTensor_storageOffset(state, x);
long yoffset = THClTensor_storageOffset(state, y);
if(n == 1)
lda = m;
clblasTranspose op = convertTransToClblasOperation(trans);
if( (m <= INT_MAX) && (n <= INT_MAX) &&
(lda > 0) && (lda <= INT_MAX) &&
(incx > 0) && (incx <= INT_MAX) &&
(incy > 0) && (incy <= INT_MAX) )
{
int i_m = (int)m;
int i_n = (int)n;
int i_lda = (int)lda;
int i_incx = (int)incx;
int i_incy = (int)incy;
cl_int err;
EasyCL *cl = ywrapper->getCl();
cl_event *event = 0;
if(state->addFinish) {
event = new cl_event();
}
err = clblasSgemv(clblasColumnMajor, op, i_m, i_n, alpha,
awrapper->getBuffer(), aoffset, i_lda,
xwrapper->getBuffer(), xoffset, i_incx,
beta,
ywrapper->getBuffer(), yoffset, i_incy,
1, cl->queue, 0, NULL, event);
if (err != CL_SUCCESS) {
THError("clblasSdot() failed with %d", err);
}
else {
if(state->addFinish) {
err = clWaitForEvents(1, event);
if (err != CL_SUCCESS) {
// throw runtime_error("clblasSger() failed with " + easycl::toString(err));
THError("clblasSger: wait for event failed with %d", err);
}
clReleaseEvent(*event);
delete event;
}
}
ywrapper->markDeviceDirty();
StatefulTimer::timeCheck("THClBlas_gemv END");
return;
}
THError("Cublas_gemv only supports m, n, lda, incx, incy"
"in the range 0 < [val] <= %d", INT_MAX);
}
示例4: THClBlas_ger
void THClBlas_ger(THClState *state, long m, long n, float alpha,
THClTensor *x, long incx,
THClTensor *y, long incy,
THClTensor *a, long lda)
{
StatefulTimer::timeCheck("THClBlas_ger START");
if(n == 1)
lda = m;
if( (m <= INT_MAX) && (n <= INT_MAX) && (lda <= INT_MAX) && (incx <= INT_MAX) && (incy <= INT_MAX) )
{
int i_m = (int)m;
int i_n = (int)n;
int i_lda = (int)lda;
int i_incx = (int)incx;
int i_incy = (int)incy;
cl_int err;
CLWrapper *xwrap = THClTensor_wrapper(state, x);
CLWrapper *ywrap = THClTensor_wrapper(state, y);
CLWrapper *awrap = THClTensor_wrapper(state, a);
long x_offset = THClTensor_storageOffset(state, x);
long y_offset = THClTensor_storageOffset(state, y);
long a_offset = THClTensor_storageOffset(state, a);
if(!awrap->isOnDevice()) {
awrap->createOnDevice();
}
EasyCL *cl = ywrap->getCl();
cl_event *event = 0;
if(state->addFinish) {
event = new cl_event();
}
err = clblasSger(clblasColumnMajor, i_m, i_n, alpha,
xwrap->getBuffer(), x_offset, i_incx,
ywrap->getBuffer(), y_offset, i_incy,
awrap->getBuffer(), a_offset, i_lda,
1, (cl->queue), 0, NULL, event);
if (err != CL_SUCCESS) {
// throw runtime_error("clblasSger() failed with " + easycl::toString(err));
THError("clblasSger() failed with %d", err);
}
else {
if(state->addFinish) {
err = clWaitForEvents(1, event);
if (err != CL_SUCCESS) {
// throw runtime_error("clblasSger() failed with " + easycl::toString(err));
THError("clblasSger: wait for event failed with %d", err);
}
clReleaseEvent(*event);
delete event;
}
}
awrap->markDeviceDirty();
StatefulTimer::timeCheck("THClBlas_ger END");
return;
}
THError("Cublas_ger only supports m, n, lda, incx, incy"
"with the bound [val] <= %d", INT_MAX);
}
示例5: THClBlas_dot
float THClBlas_dot(THClState *state, long n,
CLWrapper *xwrapper, long xoffset, long incx,
CLWrapper *ywrapper, long yoffset, long incy)
{
StatefulTimer::timeCheck("THClBlas_dot START");
if(n == 1)
{
incx = 1;
incy = 1;
}
if( (n <= INT_MAX) && (incx <= INT_MAX) && (incy <= INT_MAX) )
{
int i_n = (int)n;
int i_incx = (int)incx;
int i_incy = (int)incy;
float result;
cl_int err;
EasyCL *cl = ywrapper->getCl();
CLWrapper *resultWrapper = cl->wrap( 1, &result );
float *scratch = new float[i_n];
CLWrapper *scratchWrapper = cl->wrap(i_n, scratch);
scratchWrapper->createOnDevice();
resultWrapper->createOnDevice();
cl_event *event = 0;
// if(state->addFinish) {
event = new cl_event();
// }
err = clblasSdot( i_n, resultWrapper->getBuffer(), 0,
xwrapper->getBuffer(), xoffset, i_incx,
ywrapper->getBuffer(), yoffset, i_incy,
scratchWrapper->getBuffer(),
1, cl->queue, 0, NULL, event);
if (err != CL_SUCCESS) {
THError("clblasSdot() failed with %d", err);
}
else {
// if(state->addFinish) {
err = clWaitForEvents(1, event);
if (err != CL_SUCCESS) {
// throw runtime_error("clblasSger() failed with " + easycl::toString(err));
THError("clblasSger: wait for event failed with %d", err);
}
clReleaseEvent(*event);
delete event;
// }
}
// TODO: NOT copy to host here, use pointtensor
resultWrapper->copyToHost();
//resultWrapper->markDeviceDirty();
delete resultWrapper;
delete scratchWrapper;
delete[] scratch;
StatefulTimer::timeCheck("THClBlas_dot END");
return result;
}
THError("Cublas_dot only supports n, incx and incy "
"upto signed integer limits: %d", INT_MAX);
THError("Not implemented");
return -1;
}