/**********************************************************************
Copyright ©2014 Advanced Micro Devices, Inc. All rights reserved.
Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:
Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or
other materials provided with the distribution.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY
DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
********************************************************************/
// For clarity, error checking has been omitted.
#include <CL/cl.h>
#include <string.h>
#include <stdio.h>
#include <stdlib.h>
#include <iostream>
#include <string>
#include <fstream>
#define SUCCESS 0
#define FAILURE 1
using namespace std;
/**
 * Read the entire contents of a file (e.g. an OpenCL kernel source) into a string.
 *
 * The file is opened in binary mode and its bytes are copied verbatim, so the
 * resulting string has exactly the size of the file, including any embedded
 * NUL bytes.
 *
 * @param filename  Path of the file to read.
 * @param s         Receives the file contents on success; left untouched on failure.
 * @return SUCCESS when the whole file was read, FAILURE when it could not be
 *         opened, measured or read completely.
 */
int convertToString(const char *filename, std::string &s)
{
	std::ifstream f(filename, std::ios::in | std::ios::binary);
	if (!f.is_open())
	{
		std::cout << "Error: failed to open file\n :" << filename << std::endl;
		return FAILURE;
	}

	// Determine the file size by seeking to the end; tellg() yields -1 on failure.
	f.seekg(0, std::ios::end);
	const std::streamoff fileSize = f.tellg();
	if (fileSize < 0)
	{
		std::cout << "Error: failed to read file\n :" << filename << std::endl;
		return FAILURE;
	}
	f.seekg(0, std::ios::beg);

	// Read straight into a std::string: no manual buffer to terminate or free.
	std::string contents(static_cast<size_t>(fileSize), '\0');
	if (fileSize > 0)
	{
		f.read(&contents[0], fileSize);
		if (f.gcount() != fileSize)
		{
			std::cout << "Error: failed to read file\n :" << filename << std::endl;
			return FAILURE;
		}
	}

	s.swap(contents);
	return SUCCESS;
}
int main( int argc, char * argv[ ] )
{
/*Step1: Getting platforms and choose an available one.*/
cl_uint numPlatforms; //the NO. of platforms
cl_platform_id platform = NULL; //the chosen platform
cl_int status = clGetPlatformIDs( 0 , NULL, & numPlatforms) ;
if ( status != CL_SUCCESS)
{
cout << "Error: Getting platforms!" << endl;
return FAILURE;
}
/*For clarity, choose the first available platform. */
if ( numPlatforms > 0 )
{
cl_platform_id
* platforms
= ( cl_platform_id
* ) malloc ( numPlatforms
* sizeof ( cl_platform_id
) ) ; status = clGetPlatformIDs( numPlatforms, platforms, NULL) ;
platform = platforms[ 0 ] ;
}
/*Step 2:Query the platform and choose the first GPU device if has one.Otherwise use the CPU as device.*/
cl_uint numDevices = 0 ;
cl_device_id * devices;
status = clGetDeviceIDs( platform, CL_DEVICE_TYPE_GPU, 0 , NULL, & numDevices) ;
if ( numDevices == 0 ) //no GPU available.
{
cout << "No GPU device available." << endl;
cout << "Choose CPU as default device." << endl;
status = clGetDeviceIDs( platform, CL_DEVICE_TYPE_CPU, 0 , NULL, & numDevices) ;
devices
= ( cl_device_id
* ) malloc ( numDevices
* sizeof ( cl_device_id
) ) ; status = clGetDeviceIDs( platform, CL_DEVICE_TYPE_CPU, numDevices, devices, NULL) ;
}
else
{
devices
= ( cl_device_id
* ) malloc ( numDevices
* sizeof ( cl_device_id
) ) ; status = clGetDeviceIDs( platform, CL_DEVICE_TYPE_GPU, numDevices, devices, NULL) ;
}
/*Step 3: Create context.*/
cl_context context = clCreateContext( NULL, 1 , devices, NULL, NULL, NULL) ;
/*Step 4: Creating command queue associate with the context.*/
/*old func. code
cl_command_queue commandQueue = clCreateCommandQueue(context, devices[0], 0, NULL);
*/
/*new func.
* cl_command_queue clCreateCommandQueueWithProperties(
cl_context context,
cl_device_id device,
const cl_queue_properties *properties,
cl_int *errcode_ret)
*/
cl_command_queue commandQueue = clCreateCommandQueueWithProperties( context, devices[ 0 ] , 0 , NULL) ;
//cl_command_queue commandQueue = clCreateCommandQueue(context, devices[0], 0, NULL);
/*Step 5: Create program object */
const char * filename = "HelloWorld_Kernel.cl" ;
string sourceStr;
status = convertToString( filename, sourceStr) ;
const char * source = sourceStr.c_str ( ) ;
size_t sourceSize
[ ] = { strlen ( source
) } ; cl_program program = clCreateProgramWithSource( context, 1 , & source, sourceSize, NULL) ;
/*Step 6: Build program. */
const char options[ ] = "-cl-std=CL2.0" ;
status = clBuildProgram( program, 1 , devices, options, NULL, NULL) ;
/*Step 7: Create kernel object */
cl_kernel kernel = clCreateKernel( program, "SVMhelloworld" , NULL) ;
/*Step 8: Initial input,output for the host and create SVM buffer*/
const char * input = "HelloWorld" ;
size_t strlength
= strlen ( input
) ; char * output
= ( char * ) malloc ( strlength
+ 1 ) ; void * inputBuffer = clSVMAlloc( context, CL_MEM_READ_WRITE, ( strlength + 1 ) * sizeof ( char ) , 0 ) ;
void * outputBuffer = clSVMAlloc( context, CL_MEM_READ_WRITE, ( strlength + 1 ) * sizeof ( char ) , 0 ) ;
status = clEnqueueSVMMap( commandQueue, CL_TRUE, CL_MAP_WRITE_INVALIDATE_REGION, inputBuffer, ( strlength + 1 ) * sizeof ( char ) , 0 , NULL, NULL) ;
memcpy ( inputBuffer
, input
, strlength
) ; cout << "input string:" << endl;
cout << input << endl;
/*test inputBuffer
cout << "inputBuffer first char:" << endl;
cout << *((char *)inputBuffer) << endl;
*/
status = clEnqueueSVMUnmap( commandQueue, inputBuffer, 0 , NULL, NULL) ;
/*Step 9: Sets Kernel arguments.*/
status = clSetKernelArgSVMPointer( kernel, 0 , ( void * ) ( inputBuffer) ) ;
status = clSetKernelArgSVMPointer( kernel, 1 , ( void * ) ( outputBuffer) ) ;
/*Step 10: Running the kernel.*/
size_t global_work_size[ 1 ] = { strlength} ;
status = clEnqueueNDRangeKernel( commandQueue, kernel, 1 , NULL, global_work_size, NULL, 0 , NULL, NULL) ;
status = clEnqueueSVMMap( commandQueue, CL_TRUE, CL_MAP_WRITE_INVALIDATE_REGION, outputBuffer, ( strlength + 1 ) * sizeof ( char ) , 0 , NULL, NULL) ;
memcpy ( output
, outputBuffer
, strlength
) ; output[ strlength] = '\0 ' ; //Add the terminal character to the end of output.
/*test if kernel works and char. are all assign to outputBuffer*/
int i;
for ( i = 0 ; i < 10 ; i++ ) {
cout << "#" << i << ":" << * ( ( ( char * ) outputBuffer) + i) << endl;
}
cout << "\n output string:" << endl;
cout << output << endl;
status = clEnqueueSVMUnmap( commandQueue, outputBuffer, 0 , NULL, NULL) ;
/*Step 12: Clean the resources.*/
clSVMFree( context, inputBuffer) ;
clSVMFree( context, outputBuffer) ;
status = clReleaseKernel( kernel) ; //Release kernel.
status = clReleaseProgram( program) ; //Release the program object.
status = clReleaseCommandQueue( commandQueue) ; //Release Command queue.
status = clReleaseContext( context) ; //Release context.
if ( output != NULL)
{
output = NULL;
}
if ( devices != NULL)
{
devices = NULL;
}
cout<< "Program passed!\n " ;
return SUCCESS;
}
/**********************************************************************
Copyright ©2014 Advanced Micro Devices, Inc. All rights reserved.

Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:

	Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
	Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or
 other materials provided with the distribution.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY
 DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
 OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
 NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
********************************************************************/

// For clarity, error checking has been omitted.

#include <CL/cl.h>
#include <string.h>
#include <stdio.h>
#include <stdlib.h>
#include <iostream>
#include <string>
#include <fstream>

#define SUCCESS 0
#define FAILURE 1

using namespace std;

/**
 * Read the entire contents of a file (e.g. an OpenCL kernel source) into a string.
 *
 * The file is opened in binary mode and its bytes are copied verbatim, so the
 * resulting string has exactly the size of the file, including any embedded
 * NUL bytes.
 *
 * @param filename  Path of the file to read.
 * @param s         Receives the file contents on success; left untouched on failure.
 * @return SUCCESS when the whole file was read, FAILURE when it could not be
 *         opened, measured or read completely.
 */
int convertToString(const char *filename, std::string& s)
{
	std::ifstream f(filename, std::ios::in | std::ios::binary);
	if (!f.is_open())
	{
		std::cout << "Error: failed to open file\n:" << filename << std::endl;
		return FAILURE;
	}

	// Determine the file size by seeking to the end; tellg() yields -1 on failure.
	f.seekg(0, std::ios::end);
	const std::streamoff fileSize = f.tellg();
	if (fileSize < 0)
	{
		std::cout << "Error: failed to read file\n:" << filename << std::endl;
		return FAILURE;
	}
	f.seekg(0, std::ios::beg);

	// Read straight into a std::string: no manual buffer to terminate or free,
	// and assigning by size keeps bytes that follow an embedded NUL.
	std::string contents(static_cast<size_t>(fileSize), '\0');
	if (fileSize > 0)
	{
		f.read(&contents[0], fileSize);
		if (f.gcount() != fileSize)
		{
			std::cout << "Error: failed to read file\n:" << filename << std::endl;
			return FAILURE;
		}
	}

	s.swap(contents);
	return SUCCESS;
}

int main(int argc, char* argv[])
{

	/*Step1: Getting platforms and choose an available one.*/
	cl_uint numPlatforms;	//the NO. of platforms
	cl_platform_id platform = NULL;	//the chosen platform
	cl_int	status = clGetPlatformIDs(0, NULL, &numPlatforms);
	if (status != CL_SUCCESS)
	{
		cout << "Error: Getting platforms!" << endl;
		return FAILURE;
	}

	/*For clarity, choose the first available platform. */
	if(numPlatforms > 0)
	{
		cl_platform_id* platforms = (cl_platform_id* )malloc(numPlatforms* sizeof(cl_platform_id));
		status = clGetPlatformIDs(numPlatforms, platforms, NULL);
		platform = platforms[0];
		free(platforms);
	}

	/*Step 2:Query the platform and choose the first GPU device if has one.Otherwise use the CPU as device.*/
	cl_uint				numDevices = 0;
	cl_device_id        *devices;
	status = clGetDeviceIDs(platform, CL_DEVICE_TYPE_GPU, 0, NULL, &numDevices);	
	if (numDevices == 0)	//no GPU available.
	{
		cout << "No GPU device available." << endl;
		cout << "Choose CPU as default device." << endl;
		status = clGetDeviceIDs(platform, CL_DEVICE_TYPE_CPU, 0, NULL, &numDevices);	
		devices = (cl_device_id*)malloc(numDevices * sizeof(cl_device_id));
		status = clGetDeviceIDs(platform, CL_DEVICE_TYPE_CPU, numDevices, devices, NULL);
	}
	else
	{
		devices = (cl_device_id*)malloc(numDevices * sizeof(cl_device_id));
		status = clGetDeviceIDs(platform, CL_DEVICE_TYPE_GPU, numDevices, devices, NULL);
	}
	

	/*Step 3: Create context.*/
	cl_context context = clCreateContext(NULL,1, devices,NULL,NULL,NULL);
	
	/*Step 4: Creating command queue associate with the context.*/
	/*old func. code
		cl_command_queue commandQueue = clCreateCommandQueue(context, devices[0], 0, NULL);
    	*/
	/*new func.
    	*	cl_command_queue clCreateCommandQueueWithProperties(
			cl_context context, 
			cl_device_id device, 
			const cl_queue_properties *properties, 
			cl_int *errcode_ret)
	*/
	cl_command_queue commandQueue = clCreateCommandQueueWithProperties(context, devices[0], 0, NULL);
	//cl_command_queue commandQueue = clCreateCommandQueue(context, devices[0], 0, NULL);

	/*Step 5: Create program object */
	const char *filename = "HelloWorld_Kernel.cl";
	string sourceStr;
	status = convertToString(filename, sourceStr);
	const char *source = sourceStr.c_str();
	size_t sourceSize[] = {strlen(source)};
	cl_program program = clCreateProgramWithSource(context, 1, &source, sourceSize, NULL);
	
	/*Step 6: Build program. */
	const char options[] = "-cl-std=CL2.0";
	status = clBuildProgram(program, 1,devices, options,NULL,NULL);

	/*Step 7: Create kernel object */
	cl_kernel kernel = clCreateKernel(program,"SVMhelloworld", NULL);
	
	/*Step 8: Initial input,output for the host and create SVM buffer*/
	const char *input = "HelloWorld";
	size_t strlength = strlen(input);
	char *output = (char*) malloc(strlength + 1);
	void *inputBuffer = clSVMAlloc( context, CL_MEM_READ_WRITE, (strlength + 1) * sizeof(char), 0 );
	void *outputBuffer = clSVMAlloc( context, CL_MEM_READ_WRITE, (strlength + 1) * sizeof(char), 0 );
	
	status = clEnqueueSVMMap(commandQueue, CL_TRUE, CL_MAP_WRITE_INVALIDATE_REGION, inputBuffer, (strlength + 1) * sizeof(char), 0, NULL, NULL);
	memcpy(inputBuffer,input,strlength);
	cout << "input string:" << endl;
	cout << input << endl;
	/*test inputBuffer
	cout << "inputBuffer first char:" << endl;
	cout << *((char *)inputBuffer) << endl;
	*/
	status = clEnqueueSVMUnmap(commandQueue, inputBuffer, 0, NULL, NULL);
	
	/*Step 9: Sets Kernel arguments.*/
	status = clSetKernelArgSVMPointer(kernel,0,(void *)(inputBuffer));
    	status = clSetKernelArgSVMPointer(kernel,1,(void *)(outputBuffer));
  	
	/*Step 10: Running the kernel.*/
	size_t global_work_size[1] = {strlength};
	status = clEnqueueNDRangeKernel(commandQueue, kernel, 1, NULL, global_work_size, NULL, 0, NULL, NULL);

  	status = clEnqueueSVMMap(commandQueue, CL_TRUE, CL_MAP_WRITE_INVALIDATE_REGION, outputBuffer, (strlength + 1) * sizeof(char), 0, NULL, NULL);
	memcpy(output,outputBuffer,strlength);
	output[strlength] = '\0';	//Add the terminal character to the end of output.

	/*test if kernel works and char. are all assign to outputBuffer*/
	int i;
	for(i = 0; i < 10; i++){
		cout <<"#" << i << ":" << *(((char *)outputBuffer)+i) << endl;
	}

	cout << "\noutput string:" << endl;
	cout << output << endl;

  	status = clEnqueueSVMUnmap(commandQueue, outputBuffer, 0, NULL, NULL);

	/*Step 12: Clean the resources.*/
	clSVMFree(context, inputBuffer);  
    	clSVMFree(context, outputBuffer);  
	status = clReleaseKernel(kernel);				//Release kernel.
	status = clReleaseProgram(program);				//Release the program object.
	status = clReleaseCommandQueue(commandQueue);	//Release  Command queue.
	status = clReleaseContext(context);				//Release context.

	if (output != NULL)
	{
		free(output);
		output = NULL;
	}

	if (devices != NULL)
	{
		free(devices);
		devices = NULL;
	}

	cout<<"Program passed!\n";
	return SUCCESS;
}