调用任何入队命令时打开CL CL_INVALID_COMMAND_QUEUE
OpenCL CL_INVALID_COMMAND_QUEUE when calling any enqueue command
每次调用命令队列上的入队命令时,都会得到返回值CL_INVALID_COMMAND_QUEUE
。
锅炉板的东西(放在ctor中)运行得很好,但当我调用处理内核执行的函数时,它在完成排队的第一个位置就坏了。
我认为我的内核是非常正确的,因为没有任何OpenCL C编译器抛出错误(AMD用于vga卡,INTEL用于处理器)。另外,一个空内核显示了相同的错误。
也许这只是一个小面包屑导致了这个问题,但我看不出来
下面向您展示了我的构造函数,它应该可以正常工作:
std::vector<cl_platform_id> this->OCLPlatformList;
std::vector<std::vector<cl_device_id>> this->OCLDevicesList;
std::vector<cl_context> this->OCLContext;
className::ctor()
{
this->FFT_SIZE_3 = this->configuration->getFFTSize(FFT_MULT::FFT_3);
cl_int err;
this->samplesInBuffer = new std::complex<float>[this->FFT_SIZE_3]();
// query OCL Platforms
cl_uint platformCount;
err = clGetPlatformIDs(0,NULL,&platformCount);
OCLCheckErr(err);
cl_platform_id* plBuffer = new cl_platform_id[platformCount];
err = clGetPlatformIDs(platformCount,plBuffer,NULL);
OCLCheckErr(err);
this->OCLPlatformList.resize((unsigned int)platformCount);
this->OCLDevicesList.resize((unsigned int)platformCount);
this->OCLContext.resize((unsigned int)platformCount);
for(cl_uint i = 0; i < platformCount; i++)
{
this->OCLPlatformList[i] = plBuffer[i];
}
delete[] plBuffer;
// query OCL Devices
cl_uint devCount;
for(unsigned int i = 0; i < this->OCLPlatformList.size() - 1; i++)
{
err = clGetDeviceIDs(this->OCLPlatformList[i],CL_DEVICE_TYPE_ALL,0,NULL,&devCount);
OCLCheckErr(err);
cl_device_id* devBuffer = new cl_device_id[devCount];
err = clGetDeviceIDs(this->OCLPlatformList[i],CL_DEVICE_TYPE_ALL,devCount,devBuffer,NULL);
OCLCheckErr(err);
this->OCLDevicesList[i].resize((unsigned int)devCount);
std::cout << std::endl << "Platform #" << i << ": " << OCLGetPlatformName(this->OCLPlatformList[i]) << std::endl;
for(cl_uint j = 0; j < devCount; j++)
{
this->OCLDevicesList[i][j] = devBuffer[j];
std::cout << "|-- Device #" << j << ": " << OCLGetDeviceName(this->OCLDevicesList[i][j]) << std::endl;
}
std::cout << std::endl;
delete[] devBuffer;
}
// create OCL Context
cl_context_properties* cprops = new cl_context_properties[3];
cprops[0] = ;
cprops[2] = 0;
for(unsigned int i = 0; i < this->OCLPlatformList.size() - 1; i++)
{
cl_device_id* devBuffer = new cl_device_id[this->OCLDevicesList[i].size()];
unsigned int j = 0;
for(std::vector<cl_device_id>::iterator it = this->OCLDevicesList[i].begin(); it != this->OCLDevicesList[i].end(); ++it)
devBuffer[j++] = *it;
cprops[1] = (cl_context_properties)this->OCLPlatformList[i];
this->OCLContext[i] = clCreateContext(cprops,(cl_uint)this->OCLDevicesList[i].size(),devBuffer,NULL,NULL,&err);
OCLCheckErr(err);
}
delete[] cprops;
// create OCL Command Queue
cl_queue_properties qprops[] =
{
CL_QUEUE_PROPERTIES,CL_QUEUE_ON_DEVICE_DEFAULT,0
};
this->OCLComQueue = clCreateCommandQueueWithProperties(this->OCLContext[0],this->OCLDevicesList[0][0],qprops,&err);
OCLCheckErr(err);
cl_int commSize;
err = clGetCommandQueueInfo(this->OCLComQueue,CL_QUEUE_SIZE,sizeof(cl_int),&commSize,NULL);
std::cout << this->OCLComQueue << " " << (long)commSize << std::endl;
OCLCheckErr(OCLCompileKernelFromSource(this->OCLProgram,"Kkernel.cl",this->OCLContext[0],this->OCLDevicesList[0][0],true));
this->kernel = clCreateKernel(this->OCLProgram,"Kkernel",&err);
OCLCheckErr(err);
// create OCL Buffer
//std::complex<float> this->BufferA[this->sizeA];
this->BufferACL = clCreateBuffer(this->OCLContext[0],(CL_MEM_READ_WRITE | CL_MEM_COPY_HOST_PTR),
(this->sizeA * sizeof(std::complex<float>)),this->BufferA,&err);
OCLCheckErr(err);
//std::complex<float> this->BufferB[this->sizeB * this->k];
this->BufferBCL = clCreateBuffer(this->OCLContext[0],(CL_MEM_READ_WRITE | CL_MEM_COPY_HOST_PTR),
(this->sizeB * this->k * sizeof(std::complex<float>)),BufferB,&err);
OCLCheckErr(err);
//std::complex<float> this->BufferB[this->l * this->k];
this->BufferCCL = clCreateBuffer(this->OCLContext[0],(CL_MEM_WRITE_ONLY | CL_MEM_COPY_HOST_PTR),
(this->l * this->k * sizeof(std::complex<float>)),this->BufferC,&err);
OCLCheckErr(err);
err = clSetKernelArg(this->kernel,0,sizeof(this->BufferACL),(void*)&this->BufferACL);
OCLCheckErr(err);
err = clSetKernelArg(this->kernel,1,sizeof(this->BufferBCL),(void*)&this->BufferBCL);
OCLCheckErr(err);
err = clSetKernelArg(this->kernel,2,sizeof(this->BufferCCL),(void*)&this->BufferCCL);
OCLCheckErr(err);
err = clSetKernelArg(this->kernel,3,sizeof(unsigned int),(void*)&this->k);
OCLCheckErr(err);
}
这是应该处理内核执行的函数的第一部分。如果我注释掉内存缓冲区的排队,它在内核排队时失败:
void className::func1()
{
long c = this->k - 1;
for(std::list<std::complex<float>>::iterator it = this->sampleHistBuffer.begin(); it != this->sampleHistBuffer.end(); ++it)
{
cl_int err;
cl_event event;
clFinish(this->OCLComQueue);
OCLCheckErr(err);
err = clEnqueueWriteBuffer(this->OCLComQueue,this->BufferACL,CL_TRUE,0,(this->k * sizeof(std::complex<float>)),this->BufferA,0,NULL,&event);
OCLCheckErr(err);
cl_int state;
do
{
clGetEventInfo(event,CL_EVENT_COMMAND_EXECUTION_STATUS,sizeof(state),&state,NULL);
if(state < 0)
throw 11;
}
while(state >= CL_COMPLETE);
size_t global_item_size = this->k * this->l;
size_t local_item_size = this->k;
err = clEnqueueNDRangeKernel(this->OCLComQueue,this->kernel,1,NULL,&global_item_size,&local_item_size,0,NULL,&event);
OCLCheckErr(err);
do
{
clGetEventInfo(event,CL_EVENT_COMMAND_EXECUTION_STATUS,sizeof(state),&state,NULL);
if(state < 0)
throw 11;
}
while(state >= CL_COMPLETE);
/*...*/
}
最后但同样重要的是,这是内核的来源。它在l个工作组上对k个工作项执行乘法运算:
float2 cmult(float2 A, float2 B)
{
float2 ret;
ret.x = A.x * B.x;
ret.y = A.y * B.y;
return ret;
}
#pragma OPENCL EXTENSION cl_khr_byte_addressable_store : enable
__kernel void Kkernel(__global float2* BufferA, __global float2* BufferB, __global float2* BufferC, unsigned int k)
{
size_t sampleWrkGp = get_group_id(0);
size_t sampleWrkId = get_local_id(0);
BufferC[(sampleWrkId * k) + sampleWrkId] = cmult(BufferA[sampleWrkId],BufferB[(sampleWrkId * k) + sampleWrkId]);
}
如果有一些未描述的功能(如OCLCheckErr()
),您可以确保它们是安全的,而不是问题所在。
看起来您正在创建一个设备上的命令队列(CL_queue_on_device_DEFAULT),然后尝试使用它将来自主机的命令排入队列。您只能从设备端使用设备端命令队列。对主机端队列使用常规命令队列(clCreateCommandQueue)。
相关文章:
- 为cl.exe(Visual Studio代码)指定命令行C++版本
- 当我编译webrtc服务器时,Windows上只支持clang-cl
- 如何解决"invalid conversion from 'char' to 'const char*'"
- 如何处理 c++ 中类实现中的"invalid use of non-static data member"?
- C++ "error: invalid use of void expression"
- 收到错误"invalid use of non-static data member 'stu::n' "
- Poloniex API "Invalid command" c++ libcurl
- 使用 cl 构建代码并连接到 sqlite 库
- C++模板错误:"invalid explicitly-specified argument for template parameter"
- SDL_CreateTextureFromSurface() "Invalid texture"错误?
- C++ "Invalid use of 'this' in non-member function" ,
- 为什么gmp会在这里与"invalid next size"重新定位一起崩溃?
- MSYS2 MinGW64 在 Windows 上构建 GMP/MPFR 作为静态库,并将它们链接到使用 CL 编译的
- 继承类时"invalid use of incomplete type ‘class tree_node_t’"
- 为什么我会"Invalid read of size 8"?(瓦尔格林德)
- "fast"或"normal"在"free(): invalid next size (fast)"中是什么意思?
- 如何在Arduino程序中解决"invalid operands of types"?
- NMAKE:致命错误 U1077:cl.exe 和 nmake.exe 返回代码'0x2'
- 如何'Invalid conversion'和'no match for operator'更正这些 c++ 错误
- Clang-CL 警告 strnicmp 已弃用,请使用 ISO C 并C++符合标准的名称_strnicmp