Added a compilation routine, probably will abstract all this out into

it's own class / function. Added a small kernel that I got from a tutorial
to test the compilers error codes. Added a small notes file with error
codes. Added some error checking for the error codes
master
mitchellhansen 9 years ago
parent 49817f94b7
commit d2b79ceec3

@ -0,0 +1,32 @@
__constant sampler_t sampler =
CLK_NORMALIZED_COORDS_FALSE
| CLK_ADDRESS_CLAMP_TO_EDGE
| CLK_FILTER_NEAREST;
__constant int FILTER_SIZE = 10;
float FilterValue (__constant const float* filterWeights,
const int x, const int y)
{
return filterWeights[(x+FILTER_SIZE) + (y+FILTER_SIZE)*(FILTER_SIZE*2 + 1)];
}
__kernel void Filter (
__read_only image2d_t input,
__constant float* filterWeights,
__write_only image2d_t output)
{
const int2 pos = {get_global_id(0), get_global_id(1)};
float4 sum = (float4)(0.0f);
for(int y = -FILTER_SIZE; y <= FILTER_SIZE; y++) {
for(int x = -FILTER_SIZE; x <= FILTER_SIZE; x++) {
sum += FilterValue(filterWeights, x, y)
* read_imagef(input, sampler, pos + (int2)(x,y));
}
}
write_imagef (output, (int2)(pos.x, pos.y), sum);
}

@ -0,0 +1,47 @@
CL_SUCCESS 0
CL_DEVICE_NOT_FOUND -1
CL_DEVICE_NOT_AVAILABLE -2
CL_COMPILER_NOT_AVAILABLE -3
CL_MEM_OBJECT_ALLOCATION_FAILURE -4
CL_OUT_OF_RESOURCES -5
CL_OUT_OF_HOST_MEMORY -6
CL_PROFILING_INFO_NOT_AVAILABLE -7
CL_MEM_COPY_OVERLAP -8
CL_IMAGE_FORMAT_MISMATCH -9
CL_IMAGE_FORMAT_NOT_SUPPORTED -10
CL_BUILD_PROGRAM_FAILURE -11
CL_MAP_FAILURE -12
CL_INVALID_VALUE -30
CL_INVALID_DEVICE_TYPE -31
CL_INVALID_PLATFORM -32
CL_INVALID_DEVICE -33
CL_INVALID_CONTEXT -34
CL_INVALID_QUEUE_PROPERTIES -35
CL_INVALID_COMMAND_QUEUE -36
CL_INVALID_HOST_PTR -37
CL_INVALID_MEM_OBJECT -38
CL_INVALID_IMAGE_FORMAT_DESCRIPTOR -39
CL_INVALID_IMAGE_SIZE -40
CL_INVALID_SAMPLER -41
CL_INVALID_BINARY -42
CL_INVALID_BUILD_OPTIONS -43
CL_INVALID_PROGRAM -44
CL_INVALID_PROGRAM_EXECUTABLE -45
CL_INVALID_KERNEL_NAME -46
CL_INVALID_KERNEL_DEFINITION -47
CL_INVALID_KERNEL -48
CL_INVALID_ARG_INDEX -49
CL_INVALID_ARG_VALUE -50
CL_INVALID_ARG_SIZE -51
CL_INVALID_KERNEL_ARGS -52
CL_INVALID_WORK_DIMENSION -53
CL_INVALID_WORK_GROUP_SIZE -54
CL_INVALID_WORK_ITEM_SIZE -55
CL_INVALID_GLOBAL_OFFSET -56
CL_INVALID_EVENT_WAIT_LIST -57
CL_INVALID_EVENT -58
CL_INVALID_OPERATION -59
CL_INVALID_GL_OBJECT -60
CL_INVALID_BUFFER_SIZE -61
CL_INVALID_MIP_LEVEL -62

@ -6,6 +6,8 @@
#include <Map.h>
#include "Curses.h"
# include <GL/glew.h>
#include <fstream>
#include <sstream>
#ifdef linux
@ -18,19 +20,37 @@
# include <OpenGL/OpenGL.h>
# include <OpenCL/opencl.h>
#endif
const int WINDOW_X = 150;
const int WINDOW_Y = 150;
std::string read_file(std::string file_name){
std::ifstream input_file(file_name);
int main(){
if (!input_file.is_open()){
std::cout << file_name << " could not be opened" << std::endl;
return nullptr;
}
// ===================================================================== //
// ==== Opencl
std::stringstream buf;
buf << input_file.rdbuf();
return buf.str();
}
int main(){
char buffer[256];
char *val = getcwd(buffer, sizeof(buffer));
if (val) {
std::cout << buffer << std::endl;
}
// ===================================================================== //
// ==== Opencl setup
int error = 0;
// Get the number of platforms
@ -44,8 +64,7 @@ int main(){
// get the number of devices, fetch them, choose the first one
cl_uint deviceIdCount = 0;
std::vector<cl_device_id> deviceIds (deviceIdCount);
std::vector<cl_device_id> deviceIds;
// Try to get a GPU first
error = clGetDeviceIDs (platformIds [0], CL_DEVICE_TYPE_GPU, 0, nullptr,
&deviceIdCount);
@ -53,12 +72,18 @@ int main(){
if (deviceIdCount == 0) {
std::cout << "couldn't aquire a GPU, falling back to CPU" << std::endl;
error = clGetDeviceIDs(platformIds[0], CL_DEVICE_TYPE_CPU, 0, nullptr, &deviceIdCount);
deviceIds.resize(deviceIdCount);
error = clGetDeviceIDs(platformIds[0], CL_DEVICE_TYPE_CPU, deviceIdCount, deviceIds.data(), NULL);
} else {
std::cout << "aquired GPU cl target" << std::endl;
deviceIds.resize(deviceIdCount);
clGetDeviceIDs (platformIds[0], CL_DEVICE_TYPE_GPU, deviceIdCount, deviceIds.data (), nullptr);
}
if (error != 0){
std::cout << "Err: clGetDeviceIDs returned: " << error << std::endl;
return error;
}
// Hurray for standards!
// Setup the context properties to grab the current GL context
@ -98,11 +123,62 @@ int main(){
&error
);
if (error != 0){
std::cout << "Err: clCreateContext returned: " << error << std::endl;
return error;
}
// And the cl command queue
auto commandQueue = clCreateCommandQueue(context, deviceIds[0], 0, NULL);
auto commandQueue = clCreateCommandQueue(context, deviceIds[0], 0, &error);
if (error != 0){
std::cout << "Err: clCreateCommandQueue returned: " << error << std::endl;
return error;
}
// At this point the shared GL/CL context is up and running
// ====================================================================== //
// ========== Kernel setup & compilation
// Load in the kernel, and c stringify it
std::string kernel_source;
kernel_source = read_file("../kernels/kernel.txt");
const char* kernel_source_c_str = kernel_source.c_str();
size_t kernel_source_size = strlen(kernel_source_c_str);
// Load the source into CL's data structure
cl_program kernel_program = clCreateProgramWithSource(
context, 1,
&kernel_source_c_str,
&kernel_source_size, &error
);
if (error != 0){
std::cout << "Err: clCreateProgramWithSource returned: " << error << std::endl;
return error;
}
// Try and build the program
error = clBuildProgram(kernel_program, 1, &deviceIds[0], NULL, NULL, NULL);
// Check to see if it errored out
if (error == CL_BUILD_PROGRAM_FAILURE){
// Get the size of the queued log
size_t log_size;
clGetProgramBuildInfo(kernel_program, deviceIds[0], CL_PROGRAM_BUILD_LOG, 0, NULL, &log_size);
char *log = new char[log_size];
// Grab the log
clGetProgramBuildInfo(kernel_program, deviceIds[0], CL_PROGRAM_BUILD_LOG, log_size, log, NULL);
std::cout << "Err: clBuildProgram returned: " << error << std::endl;
std::cout << log << std::endl;
return error;
}
};

Loading…
Cancel
Save