/*
 * AlphaKernel - element-wise difference of two buffers.
 *
 * Each work-item stores cl_input1[i] - cl_input2[i] into cl_output[i], where
 * i is the work-group index in dimension 0.
 *
 * The element type is spelled out as int: the previous declarators had no
 * type specifier, which OpenCL C (based on C99) does not allow and which
 * permissive compilers treat as int.
 * NOTE(review): a commented-out variant of this signature used float;
 * confirm the element type against the host-side buffers.
 *
 * NOTE(review): the index is the work-group id, not the global work-item id,
 * so every work-item in a group writes the same element. The two coincide
 * only when the local work size is 1 and no global offset is used - confirm
 * the host's launch configuration before switching to get_global_id(0).
 */
__kernel void AlphaKernel(__global const int *cl_input1,
                          __global const int *cl_input2,
                          __global int *cl_output)
{
	/* get_group_id() already returns size_t; no narrowing round-trip needed. */
	const size_t i = get_group_id(0);

	cl_output[i] = cl_input1[i] - cl_input2[i];
}
