作为初学者一直,经过多次的上网搜索你一定会看到迈克老狼的向量加法的示例,不知道你是否和我一样,刚开始并不是很准确的知道他的add.cl写的代码的意思,源码如下:

#pragma OPENCL EXTENSION cl_amd_printf : enable
__kernel void vecadd(__global const float* a, __global const float* b, __global float* c) { int x = get_global_id(); int y = get_global_id(); int width = get_global_size(); int height = get_global_size(); if(x == && y ==) printf("%d, %d,%d,%d,%d,%d\n",get_local_size(),get_local_size(),get_local_id(), get_local_id(),get_group_id(),get_group_id()); c[x + y * width] = a[x + y * width] + b[x + y * width]; } 我们在k

这里面我把二维的这些值全部罗列出来如下:

int idx = get_global_id(0);
int idy = get_global_id(1);

uint wiWidth = get_global_size(0);
uint wiHeight = get_global_size(1);

uint gix_t = get_group_id(0);
uint giy_t = get_group_id(1);

uint num_of_blocks_x = get_num_groups(0);
uint num_of_blocks_y = get_num_groups(1);

uint lix = get_local_id(0);
uint liy = get_local_id(1);

你会奇怪为什么他的add.cl优化会这么写:

c[x + y * width] = a[x + y * width] + b[x + y * width];

下面进行分析:

add.cpp关键的代码部分如下(只罗列出部分代码):

#define width 8//256
#define height 16//256
#define NWITEMS width*height//262144 size_t globalThreads[] = {width, height};
size_t localx, localy; localx = 2;
localy = 4; size_t localThreads[] = {localx, localy}; clEnqueueNDRangeKernel( queue,
kernel,
2,
NULL,
globalThreads,
localThreads, 0, NULL, &ev);

我自己的add.cl代码如下(里面添加啦打印,以便我们可以看出结果):

   int idx = get_global_id();
int idy = get_global_id(); uint wiWidth = get_global_size();
uint wiHeight = get_global_size();
printf("Magnum Global idx = %d, idy = %d, sizeX =%d,sizeY =%d\n",idx,idy,wiWidth,wiHeight); uint gix_t = get_group_id();
uint giy_t = get_group_id();
uint num_of_blocks_x = get_num_groups();
uint num_of_blocks_y = get_num_groups(); printf("Magnum Group idx = %d, idy = %d, blockX=%d,blockY=%d\n",gix_t,gix_t,num_of_blocks_x,num_of_blocks_y); uint lix = get_local_id();
uint liy = get_local_id(); uint LocalX = get_local_size();
uint LocalY = get_local_size(); printf("Magnum Local idx = %d, idy = %d, localX=%d,localY=%d\n\n",lix,liy,LocalX,LocalY);

输出的结果如下:

Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY= Magnum Global idx = , idy = , sizeX =,sizeY =
Magnum Group idx = , idy = , blockX=,blockY=
Magnum Local idx = , idy = , localX=,localY=

从从这个结果首先能说明几个问题:

首先我们在:

  1. clEnqueueNDRangeKernel( queue, kernel, , NULL, globalThreads, localThreads, 0, NULL, &ev); 设置维度是2,否则add.cl中所有类似get_local_size(1)将只会返回一。
  2. 设置GlobaThreads 和 LocalThreads 不一定是 GlobalThreads= {8, 8}; 也可以不相等,LocalThreads也是一样。
  3. 理解opencl中的内存分布可以理解为二维数组,而且内存寻址的方向就像是:左上角(0,0)为原点,一行一行的扫描下去。
  4. WorkGroup的大小,目前我认为X,Y可以分开来理解(后面若发现错误我会及时改正) WorkGroup number(x) = GlobalThread(x)/LocalThread(x).
  5. 最小的单位是LocalX * LocalY, 然后用总的GlobalThreads按照这个单位进行分割成一个一个的组。每个二维的小单位还是一行一行的扫描过去的。目前我们的这个是8*16,你会发现总的Thread也是8*16,对应的每一个线程执行一次加法操作,有人会问可不可以不用这么多呢,用4*16个Threads,每个线程里面做两次加法动作,其实是可以的,这个原则是根据你的具体的Device来说的,当前我们说的是Device是GPU,比如你的GPU当前支持最大的线程数是1024*1024,这种情况,你不用多的,而是用少的线程来做,会降低你的效率,你需要尽可能的让Device满负荷工作这样才能达到提高运算速度。

继续分析为什么 NDRange改成二维的之后,add.cl变成:

c[x + y * width] = a[x + y * width] + b[x + y * width];

因为在CPU端每个 C[8*16],通过打印可以在这里C[x+y*width],x 最大是7,width是8,y最大是17,只有这样才能做完所有的向量相加。

使用二维NDRange workgroup的更多相关文章

  1. OpenCL 学习step by step (5) 使用二维NDRange workgroup

    http://www.cnblogs.com/mikewolf2002/archive/2012/09/07/2675634.html 在本教程中,我们使用二维NDRange来设置workgroup, ...

  2. Javascript生成二维码(QR)

    网络上已经有非常多的二维码编码和解码工具和代码,很多都是服务器端的,也就是说需要一台服务器才能提供二维码的生成.本着对服务器性能的考虑,这种小事情都让服务器去做,感觉对不住服务器,尤其是对于大流量的网 ...

  3. iOS二维码生成、识别、扫描等

    二维码扫描 前言: 最近的项目中使用到了二维码,二维码这个模块功能也完成:觉得还是有必要总结一下用来做记录.好长时间没有写二维码了都忘记在差不多了,重新拾起来还是挻快的. 二维码使用场景: 生活中有很 ...

  4. 很多人很想知道怎么扫一扫二维码就能打开网站,就能添加联系人,就能链接wifi,今天说下这些格式,明天做个demo

    有些功能部分手机不能使用,网站,通讯录,wifi基本上每个手机都可以使用. 在看之前你可以扫一扫下面几个二维码先看看效果: 1.二维码生成 网址 (URL) 包含网址的 二维码生成 是大家平时最常接触 ...

  5. 免费开源的DotNet二维码操作组件ThoughtWorks.QRCode(.NET组件介绍之四)

    在生活中有一种东西几乎已经快要成为我们的另一个电子”身份证“,那就是二维码.无论是在软件开发的过程中,还是在普通用户的日常中,几乎都离不开二维码.二维码 (dimensional barcode) , ...

  6. 基于SignalR的消息推送与二维码描登录实现

    1 概要说明 使用微信扫描登录相信大家都不会陌生吧,二维码与手机结合产生了不同应用场景,基于二维码的应用更是比较广泛.为了满足ios.android客户端与web短信平台的结合,特开发了基于Singl ...

  7. 微信小程序的机会在于重新理解群组与二维码

    历时一年,唯一一个尚未发布就获得Pony Ma与Allen Zhang站台的产品:微信小程序,将于2017年1月9日正式上线了.我很期待.唯一要警惕的是:防止长考出臭棋. 在上线前夕,我对于如何借助小 ...

  8. javaScript生成二维码(支持中文,生成logo)

    资料搜索 选择star最多的两个 第一个就是用的比较多的jquery.qrcode.js(但不支持中文,不能带logo)啦,第二个支持ie6+,支持中文,根据第二个源代码,使得,jquery.qrco ...

  9. 微信小程序二维码推广统计

    微信小程序可以通过生成带参数的二维码,那么这个参数是可以通过APP的页面进行监控的 这样就可以统计每个二维码的推广效果. 今天由好推二维码推出的小程序统计工具HotApp小程序统计也推出了带参数二维码 ...

随机推荐

  1. C#中的Collections命名空间

    System.Collections命名空间包含可使用的集合类和相关的接口. 该命名空间下的.NET非泛型集合类如下所示: — System.Collections.ArrayList:数组集合类,使 ...

  2. OpenCV2学习笔记02:MSVC2013搭建OpenCV开发环境

    我这里编译的库是通过手动编译的.只是需要注意的是,手动编译一般会产生大量的文件,差不多7个多G的样子,实在是有点浪费硬盘存储呀,其实我们可以删除掉没有用的东西.因为我们在编译的时候指定了一个目录比如我 ...

  3. WinForm TreeView 三种状态

    private void treeView1_NodeMouseClick(object sender, TreeNodeMouseClickEventArgs e) { var node = e.N ...

  4. dom三个事件

    1,页面加载后 window.onload=function(){}; 2,页面(关闭)卸载后触发 window.onunload=function(){}; 3,页面关闭前触发 window.onb ...

  5. What is Windows Clustering

    A cluster is a group of independent computer systems, referred to as nodes, working together as a un ...

  6. Quartz2D学习笔记(1)

    ********************************** 简介 *************************************** Quartz2D是⼀个二维绘图引擎,同时支持 ...

  7. 第一个CUDA程序

    开始学CUDA 先写一个简单的 #include<iostream>__global__ void add( int a, int b, int *c ) { *c = a + b;}in ...

  8. PHP、JSP、.NET各自的真正优势是什么

    PHP的优势在于, 跨平台, 极易部署, 易维护, 为Web而生, 开源社区强大, 文档丰富.至于说3足鼎立, 谈不上, 全球前100万的sites中, 70%是PHP. JSP和Asp..net 也 ...

  9. 用Python和Django实现多用户博客系统——UUBlog

    又过了一周,把代码整个的优化和完善了一下,也把TBlog更名为UUBlog.这次基本是把上次的整个更新了一下具体的功能大家可以下载后自己看看说一下主要的变化增加了频道表.博客表. 功能方面主要有增加频 ...

  10. iBatis系列之三

    iBatis和Hibernate最大差别就是在于iBatis没有严格的和具体的表做关联:而是将结果集和DAO做关联. iBatis的SqlConfig.xml配置一个properties文件,其实可以 ...