You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
3249 lines
130 KiB
3249 lines
130 KiB
//
|
|
// Copyright (c) 2017 The Khronos Group Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
#include "testBase.h"
|
|
#if defined(_WIN32)
|
|
#include <time.h>
|
|
#elif defined(__linux__) || defined(__APPLE__)
|
|
#include <sys/time.h>
|
|
#include <unistd.h>
|
|
#endif
|
|
#include "harness/conversions.h"
|
|
|
|
/* Size of the scratch buffer used when formatting one generated source line */
#define MAX_LINE_SIZE_IN_PROGRAM 1024
#define MAX_LOG_SIZE_IN_PROGRAM 2048

/* Opening part of the generated "long" kernel: signature plus the two locals
   (temp, tid) that the statements in sample_kernel_lines refer to. */
const char *sample_kernel_start =
    "__kernel void sample_test(__global float *src, __global int *dst)\n"
    "{\n"
    " float temp;\n"
    " int tid = get_global_id(0);\n";

/* Closing brace of the generated kernel */
const char *sample_kernel_end = "}\n";

/* Pool of statements; test_large_single_compile() picks from it at random to
   fill the kernel body. */
const char *sample_kernel_lines[] = {
    "dst[tid] = src[tid];\n",
    "dst[tid] = src[tid] * 3.f;\n",
    "temp = src[tid] / 4.f;\n",
    "dst[tid] = dot(temp,src[tid]);\n",
    "dst[tid] = dst[tid] + temp;\n"
};
|
|
|
|
/* I compile and link therefore I am. Robert Ioffe */
/* Kernel sources used by the separate-compilation and linking tests below */

/* A single kernel that copies src to dst element by element */
const char *simple_kernel =
    "__kernel void\n"
    "CopyBuffer(\n"
    " __global float* src,\n"
    " __global float* dst )\n"
    "{\n"
    " int id = (int)get_global_id(0);\n"
    " dst[id] = src[id];\n"
    "}\n";

/* Same signature as simple_kernel, but the body refers to the FIRST and
   SECOND identifiers, which this source does not define itself. */
const char *simple_kernel_with_defines =
    "__kernel void\n"
    "CopyBuffer(\n"
    " __global float* src,\n"
    " __global float* dst )\n"
    "{\n"
    " int id = (int)get_global_id(0);\n"
    " float temp = src[id] - 42;\n"
    " dst[id] = FIRST + temp + SECOND;\n"
    "}\n";

/* printf-style template: %d becomes the numeric suffix of the kernel name */
const char *simple_kernel_template =
    "__kernel void\n"
    "CopyBuffer%d(\n"
    " __global float* src,\n"
    " __global float* dst )\n"
    "{\n"
    " int id = (int)get_global_id(0);\n"
    " dst[id] = src[id];\n"
    "}\n";

/* Header of the kernel that calls every generated CopyBuffer<N> */
const char *composite_kernel_start =
    "__kernel void\n"
    "CompositeKernel(\n"
    " __global float* src,\n"
    " __global float* dst )\n"
    "{\n";

/* Closing brace of CompositeKernel */
const char *composite_kernel_end = "}\n";

/* One call statement inside CompositeKernel; %d is the kernel index */
const char *composite_kernel_template =
    " CopyBuffer%d(src, dst);\n";

/* Extern declaration matching simple_kernel_template; %d is the kernel index */
const char *composite_kernel_extern_template =
    "extern __kernel void\n"
    "CopyBuffer%d(\n"
    " __global float* src,\n"
    " __global float* dst );\n";

/* Declares CopyBuffer as extern and wraps it in AnotherCopyBuffer */
const char *another_simple_kernel =
    "extern __kernel void\n"
    "CopyBuffer(\n"
    " __global float* src,\n"
    " __global float* dst );\n"
    "__kernel void\n"
    "AnotherCopyBuffer(\n"
    " __global float* src,\n"
    " __global float* dst )\n"
    "{\n"
    " CopyBuffer(src, dst);\n"
    "}\n";
|
|
|
|
/* Contents of an embedded header that declares CopyBuffer as extern */
const char *simple_header =
    "extern __kernel void\n"
    "CopyBuffer(\n"
    " __global float* src,\n"
    " __global float* dst );\n";

/* Include name under which simple_header is referenced */
const char *simple_header_name = "simple_header.h";

/* Like another_simple_kernel, except that the CopyBuffer declaration comes
   from #include "simple_header.h" instead of being spelled out inline. */
const char *another_simple_kernel_with_header =
    "#include \"simple_header.h\"\n"
    "__kernel void\n"
    "AnotherCopyBuffer(\n"
    " __global float* src,\n"
    " __global float* dst )\n"
    "{\n"
    " CopyBuffer(src, dst);\n"
    "}\n";

/* Header name templates at four directory depths; %d is the header index.
   test_large_multiple_embedded_headers() selects one with (index % 4). */
const char *header_name_templates[4] = {
    "simple_header%d.h",
    "foo/simple_header%d.h",
    "foo/bar/simple_header%d.h",
    "foo/bar/baz/simple_header%d.h"
};

/* #include lines matching header_name_templates entry for entry */
const char *include_header_name_templates[4] = {
    "#include \"simple_header%d.h\"\n",
    "#include \"foo/simple_header%d.h\"\n",
    "#include \"foo/bar/simple_header%d.h\"\n",
    "#include \"foo/bar/baz/simple_header%d.h\"\n"
};
|
|
|
|
/* OpenCL C snippets that only declare an entity as extern.
   NOTE(review): their consumers are outside the visible part of this file. */
const char *compile_extern_var = "extern constant float foo;\n";
const char *compile_extern_struct = "extern constant struct bar bart;\n";
const char *compile_extern_function = "extern int baz(int, int);\n";

/* Snippets that define an entity named foo with static linkage */
const char *compile_static_var = "static constant float foo = 2.78;\n";
const char *compile_static_struct = "static constant struct bar {float x, y, z, r; int color; } foo = {3.14159};\n";
const char *compile_static_function = "static int foo(int x, int y) { return x*x + y*y; }\n";

/* Snippets that define an entity named foo without a storage-class keyword */
const char *compile_regular_var = "constant float foo = 4.0f;\n";
const char *compile_regular_struct = "constant struct bar {float x, y, z, r; int color; } foo = {0.f, 0.f, 0.f, 0.f, 0};\n";
const char *compile_regular_function = "int foo(int x, int y) { return x*x + y*y; }\n";

/* Companion to compile_static_var: reads foo through an extern declaration */
const char *link_static_var_access =
    "extern constant float foo;\n"
    "float access_foo() { return foo; }\n";

/* Companion to compile_static_struct */
const char *link_static_struct_access =
    "extern constant struct bar{float x, y, z, r; int color; } foo;\n"
    "struct bar access_foo() {return foo; }\n";

/* Companion to compile_static_function */
const char *link_static_function_access =
    "extern int foo(int, int);\n"
    "int access_foo() { int blah = foo(3, 4); return blah + 5; }\n";
|
|
|
|
/*
 * Creates and builds one program made of numLines source strings: the kernel
 * prologue (sample_kernel_start), numLines - 2 statements drawn from
 * sample_kernel_lines with a generator seeded by gRandomSeed, and the closing
 * brace (sample_kernel_end).
 *
 * Returns 0 on success; -1 if numLines is too small, the line array cannot be
 * allocated or the program cannot be created; otherwise the OpenCL error code
 * of the failing build/release call. The line array and the program object
 * are released on every path.
 */
int test_large_single_compile(cl_context context, cl_device_id deviceID, unsigned int numLines)
{
    int error;
    cl_program program = NULL;
    const char **lines;
    unsigned int numChoices, i;
    MTdata d;

    /* Slot 0 and slot numLines - 1 must be distinct: with fewer than two
       lines the index below would wrap around (0) or alias the prologue (1). */
    if (numLines < 2) {
        log_error( "ERROR: A long test program needs at least 2 lines, got %d! (in %s:%d)\n", numLines, __FILE__, __LINE__);
        return -1;
    }

    /* First, allocate the array for our line pointers */
    lines = (const char **)malloc( numLines * sizeof( const char * ) );
    if (lines == NULL) {
        log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", numLines, __FILE__, __LINE__);
        return -1;
    }

    /* First and last lines are easy */
    lines[ 0 ] = sample_kernel_start;
    lines[ numLines - 1 ] = sample_kernel_end;

    numChoices = sizeof( sample_kernel_lines ) / sizeof( sample_kernel_lines[ 0 ] );

    /* Fill the rest with random lines to hopefully prevent much optimization */
    d = init_genrand( gRandomSeed );
    for( i = 1; i < numLines - 1; i++ )
    {
        lines[ i ] = sample_kernel_lines[ genrand_int32(d) % numChoices ];
    }
    free_mtdata(d); d = NULL;

    /* Try to create a program with these lines */
    error = create_single_kernel_helper_create_program(context, &program, numLines, lines);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
        free( lines );
        if (program != NULL)
        {
            error = clReleaseProgram( program );
            test_error( error, "Unable to release a program object" );
        }
        return -1;
    }

    /* Build it */
    error = clBuildProgram( program, 1, &deviceID, NULL, NULL, NULL );

    /* The line pointers are not used again after the build attempt, so drop
       them before looking at the result; no exit below can then leak them. */
    free( lines );

    if( error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to build a long program! (%s from %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        /* Best-effort release; the build failure is the error we report */
        clReleaseProgram( program );
        return error;
    }

    /* All done! Nothing else is owned at this point, so an early exit from
       test_error (harness macro, not visible here) cannot leak anything. */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release a program object" );

    return 0;
}
|
|
|
|
/*
 * Runs test_large_single_compile() for each entry of a zero-terminated list
 * of program sizes and logs how long each run took (clock() on Windows,
 * gettimeofday() on Linux/macOS, no timing elsewhere).
 *
 * Returns 0 when every size succeeds and -1 as soon as one fails.
 * queue and num_elements are not used by this function.
 */
int test_large_compile(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    /* Line counts to try; the trailing 0 ends the list */
    unsigned int lineCounts[] = { 64, 128, 256, 512, 1024, 2048, 4096, 0 };
    unsigned int idx = 0;

    log_info( "Testing large compiles...this might take awhile...\n" );

    while( lineCounts[ idx ] != 0 )
    {
        const unsigned int lineCount = lineCounts[ idx ];

        log_info( " %d...\n", lineCount );

#if defined(_WIN32)
        clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        timeval before, after;
        gettimeofday(&before, NULL);
#endif

        if( test_large_single_compile( context, deviceID, lineCount ) != 0 )
        {
            log_error( "ERROR: long program test failed for %d lines! (in %s:%d)\n", lineCount, __FILE__, __LINE__);
            return -1;
        }

#if defined(_WIN32)
        clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", lineCount );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&after, NULL);
        log_perf( (float)(after.tv_sec - before.tv_sec) + 1.0e-6 * (after.tv_usec - before.tv_usec), false, "wall time in secs", "%d lines", lineCount );
#endif

        ++idx;
    }

    return 0;
}
|
|
|
|
/* Defined later in this file; declared here because the tests below call it
   with the linked composite kernel. */
static int verifyCopyBuffer(cl_context context, cl_command_queue queue, cl_kernel kernel);

/* Map the _strdup spelling used throughout this file onto strdup on macOS
   and Linux. __linux__ is tested as well as __linux so that this guard agrees
   with the other platform checks in this file. */
#if defined(__APPLE__) || defined(__linux__) || defined(__linux)
#define _strdup strdup
#endif
|
|
|
|
int test_large_multi_file_library(cl_context context, cl_device_id deviceID, cl_command_queue queue, unsigned int numLines)
|
|
{
|
|
int error;
|
|
cl_program program;
|
|
cl_program *simple_kernels;
|
|
const char **lines;
|
|
unsigned int i;
|
|
char buffer[MAX_LINE_SIZE_IN_PROGRAM];
|
|
|
|
simple_kernels = (cl_program*)malloc(numLines*sizeof(cl_program));
|
|
if (simple_kernels == NULL) {
|
|
log_error( "ERROR: Unable to allocate kernels array with %d kernels! (in %s:%d)\n", numLines, __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
/* First, allocate the array for our line pointers */
|
|
lines = (const char **)malloc( (2*numLines + 2) * sizeof( const char * ) );
|
|
if (lines == NULL) {
|
|
free(simple_kernels);
|
|
log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", (2*numLines + 2), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, composite_kernel_extern_template, i);
|
|
lines[i] = _strdup(buffer);
|
|
}
|
|
/* First and last lines are easy */
|
|
lines[ numLines ] = composite_kernel_start;
|
|
lines[ 2* numLines + 1] = composite_kernel_end;
|
|
|
|
/* Fill the rest with templated kernels */
|
|
for( i = numLines + 1; i < 2* numLines + 1; i++ )
|
|
{
|
|
sprintf(buffer, composite_kernel_template, i - numLines - 1);
|
|
lines[ i ] = _strdup(buffer);
|
|
}
|
|
|
|
/* Try to create a program with these lines */
|
|
error = create_single_kernel_helper_create_program(context, &program, 2 * numLines + 2, lines);
|
|
if( program == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s) (in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
free( simple_kernels );
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
free( (void*)lines[i] );
|
|
free( (void*)lines[i+numLines+1] );
|
|
}
|
|
free( lines );
|
|
if (program != NULL)
|
|
{
|
|
error = clReleaseProgram( program );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
/* Create and compile templated kernels */
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, simple_kernel_template, i);
|
|
const char* kernel_source = _strdup(buffer);
|
|
simple_kernels[i] = clCreateProgramWithSource( context, 1, &kernel_source, NULL, &error );
|
|
if( simple_kernels[i] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s) (in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(simple_kernels[i], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
free((void*)kernel_source);
|
|
}
|
|
|
|
/* Create library out of compiled templated kernels */
|
|
cl_program my_newly_minted_library = clLinkProgram(context, 1, &deviceID, "-create-library", numLines, simple_kernels, NULL, NULL, &error);
|
|
test_error( error, "Unable to create a multi-line library" );
|
|
|
|
/* Link the program that calls the kernels and the library that contains them */
|
|
cl_program programs[2] = { program, my_newly_minted_library };
|
|
cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 2, programs, NULL, NULL, &error);
|
|
test_error( error, "Unable to link a program with a library" );
|
|
|
|
// Create the composite kernel
|
|
cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CompositeKernel", &error);
|
|
test_error( error, "Unable to create a composite kernel" );
|
|
|
|
// Run the composite kernel and verify the results
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
error = clReleaseProgram( program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
free( (void*)lines[i] );
|
|
free( (void*)lines[i+numLines+1] );
|
|
}
|
|
free( lines );
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
error = clReleaseProgram( simple_kernels[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
free( simple_kernels );
|
|
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseProgram( my_newly_minted_library );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( my_newly_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Runs test_large_multi_file_library() for each entry of a zero-terminated
 * list of kernel counts and logs how long each run took (clock() on Windows,
 * gettimeofday() on Linux/macOS, no timing elsewhere).
 *
 * Returns 0 when every count succeeds and -1 as soon as one fails.
 * num_elements is not used by this function.
 */
int test_multi_file_libraries(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    /* Kernel counts to try; the trailing 0 ends the list */
    unsigned int kernelCounts[] = { 2, 4, 8, 16, 32, 64, 128, 256, 0 };
    unsigned int idx = 0;

    log_info( "Testing multi-file libraries ...this might take awhile...\n" );

    while( kernelCounts[ idx ] != 0 )
    {
        const unsigned int kernelCount = kernelCounts[ idx ];

        log_info( " %d...\n", kernelCount );

#if defined(_WIN32)
        clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        timeval before, after;
        gettimeofday(&before, NULL);
#endif

        if( test_large_multi_file_library( context, deviceID, queue, kernelCount ) != 0 )
        {
            log_error( "ERROR: multi-file library program test failed for %d lines! (in %s:%d)\n\n", kernelCount, __FILE__, __LINE__ );
            return -1;
        }

#if defined(_WIN32)
        clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", kernelCount );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&after, NULL);
        log_perf( (float)(after.tv_sec - before.tv_sec) + 1.0e-6 * (after.tv_usec - before.tv_usec), false, "wall time in secs", "%d lines", kernelCount );
#endif

        ++idx;
    }

    return 0;
}
|
|
|
|
int test_large_multiple_embedded_headers(cl_context context, cl_device_id deviceID, cl_command_queue queue, unsigned int numLines)
|
|
{
|
|
int error;
|
|
cl_program program;
|
|
cl_program *simple_kernels;
|
|
cl_program *headers;
|
|
const char **header_names;
|
|
const char **lines;
|
|
unsigned int i;
|
|
char buffer[MAX_LINE_SIZE_IN_PROGRAM];
|
|
|
|
simple_kernels = (cl_program*)malloc(numLines*sizeof(cl_program));
|
|
if (simple_kernels == NULL) {
|
|
log_error( "ERROR: Unable to allocate simple_kernels array with %d lines! (in %s:%d)\n", numLines, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
headers = (cl_program*)malloc(numLines*sizeof(cl_program));
|
|
if (headers == NULL) {
|
|
log_error( "ERROR: Unable to allocate headers array with %d lines! (in %s:%d)\n", numLines, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
/* First, allocate the array for our line pointers */
|
|
header_names = (const char**)malloc( numLines*sizeof( const char * ) );
|
|
if (header_names == NULL) {
|
|
log_error( "ERROR: Unable to allocate header_names array with %d lines! (in %s:%d)\n", numLines, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
lines = (const char **)malloc( (2*numLines + 2)*sizeof( const char * ) );
|
|
if (lines == NULL) {
|
|
log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", (2*numLines + 2), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, include_header_name_templates[i % 4], i);
|
|
lines[i] = _strdup(buffer);
|
|
sprintf(buffer, header_name_templates[i % 4], i);
|
|
header_names[i] = _strdup(buffer);
|
|
|
|
sprintf(buffer, composite_kernel_extern_template, i);
|
|
const char* line = _strdup(buffer);
|
|
error = create_single_kernel_helper_create_program(context, &headers[i], 1, &line);
|
|
if( headers[i] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create a simple header program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
}
|
|
/* First and last lines are easy */
|
|
lines[ numLines ] = composite_kernel_start;
|
|
lines[ 2* numLines + 1 ] = composite_kernel_end;
|
|
|
|
/* Fill the rest with templated kernels */
|
|
for( i = numLines + 1; i < 2* numLines + 1; i++ )
|
|
{
|
|
sprintf(buffer, composite_kernel_template, i - numLines - 1);
|
|
lines[ i ] = _strdup(buffer);
|
|
}
|
|
|
|
/* Try to create a program with these lines */
|
|
error = create_single_kernel_helper_create_program(context, &program, 2 * numLines + 2, lines);
|
|
if( program == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s) (in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(program, 1, &deviceID, NULL, numLines, headers, header_names, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
/* Create and compile templated kernels */
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, simple_kernel_template, i);
|
|
const char* kernel_source = _strdup(buffer);
|
|
error = create_single_kernel_helper_create_program(context, &simple_kernels[i], 1, &kernel_source);
|
|
if( simple_kernels[i] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s) (in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(simple_kernels[i], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
free((void*)kernel_source);
|
|
}
|
|
|
|
/* Create library out of compiled templated kernels */
|
|
cl_program my_newly_minted_library = clLinkProgram(context, 1, &deviceID, "-create-library", numLines, simple_kernels, NULL, NULL, &error);
|
|
test_error( error, "Unable to create a multi-line library" );
|
|
|
|
/* Link the program that calls the kernels and the library that contains them */
|
|
cl_program programs[2] = { program, my_newly_minted_library };
|
|
cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 2, programs, NULL, NULL, &error);
|
|
test_error( error, "Unable to link a program with a library" );
|
|
|
|
// Create the composite kernel
|
|
cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CompositeKernel", &error);
|
|
test_error( error, "Unable to create a composite kernel" );
|
|
|
|
// Run the composite kernel and verify the results
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
error = clReleaseProgram( program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
free( (void*)lines[i] );
|
|
free( (void*)header_names[i] );
|
|
}
|
|
for( i = numLines + 1; i < 2* numLines + 1; i++ )
|
|
{
|
|
free( (void*)lines[i] );
|
|
}
|
|
free( lines );
|
|
free( header_names );
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
error = clReleaseProgram( simple_kernels[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
error = clReleaseProgram( headers[i] );
|
|
test_error( error, "Unable to release header program object" );
|
|
}
|
|
free( simple_kernels );
|
|
free( headers );
|
|
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseProgram( my_newly_minted_library );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( my_newly_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Runs test_large_multiple_embedded_headers() for each entry of a
 * zero-terminated list of header counts and logs how long each run took
 * (clock() on Windows, gettimeofday() on Linux/macOS, no timing elsewhere).
 *
 * Returns 0 when every count succeeds and -1 as soon as one fails.
 * num_elements is not used by this function.
 */
int test_multiple_embedded_headers(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    /* Header counts to try; the trailing 0 ends the list */
    unsigned int headerCounts[] = { 2, 4, 8, 16, 32, 64, 128, 256, 0 };
    unsigned int idx = 0;

    log_info( "Testing multiple embedded headers ...this might take awhile...\n" );

    while( headerCounts[ idx ] != 0 )
    {
        const unsigned int headerCount = headerCounts[ idx ];

        log_info( " %d...\n", headerCount );

#if defined(_WIN32)
        clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        timeval before, after;
        gettimeofday(&before, NULL);
#endif

        if( test_large_multiple_embedded_headers( context, deviceID, queue, headerCount ) != 0 )
        {
            log_error( "ERROR: multiple embedded headers program test failed for %d lines! (in %s:%d)\n", headerCount, __FILE__, __LINE__ );
            return -1;
        }

#if defined(_WIN32)
        clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", headerCount );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&after, NULL);
        log_perf( (float)(after.tv_sec - before.tv_sec) + 1.0e-6 * (after.tv_usec - before.tv_usec), false, "wall time in secs", "%d lines", headerCount );
#endif

        ++idx;
    }

    return 0;
}
|
|
|
|
/* Logarithm of a in the given base, computed as log(a) / log(base). */
double logbase(double a, double base)
{
    const double logOfValue = log(a);
    const double logOfBase = log(base);

    return logOfValue / logOfBase;
}
|
|
|
|
int test_large_multiple_libraries(cl_context context, cl_device_id deviceID, cl_command_queue queue, unsigned int numLines)
|
|
{
|
|
int error;
|
|
cl_program *simple_kernels;
|
|
const char **lines;
|
|
unsigned int i;
|
|
char buffer[MAX_LINE_SIZE_IN_PROGRAM];
|
|
/* I want to create (log2(N)+1)/2 libraries */
|
|
unsigned int level = (unsigned int)(logbase(numLines, 2.0) + 1.000001)/2;
|
|
unsigned int numLibraries = (unsigned int)pow(2.0, level - 1.0);
|
|
unsigned int numFilesInLib = numLines/numLibraries;
|
|
cl_program *my_program_and_libraries = (cl_program*)malloc((1+numLibraries)*sizeof(cl_program));
|
|
if (my_program_and_libraries == NULL) {
|
|
log_error( "ERROR: Unable to allocate program array with %d programs! (in %s:%d)\n", (1+numLibraries), __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
|
|
log_info("level - %d, numLibraries - %d, numFilesInLib - %d\n", level, numLibraries, numFilesInLib);
|
|
|
|
simple_kernels = (cl_program*)malloc(numLines*sizeof(cl_program));
|
|
if (simple_kernels == NULL) {
|
|
log_error( "ERROR: Unable to allocate kernels array with %d kernels! (in %s:%d)\n", numLines, __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
/* First, allocate the array for our line pointers */
|
|
lines = (const char **)malloc( (2*numLines + 2) * sizeof( const char * ) );
|
|
if (lines == NULL) {
|
|
log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", (2*numLines + 2), __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, composite_kernel_extern_template, i);
|
|
lines[i] = _strdup(buffer);
|
|
}
|
|
/* First and last lines are easy */
|
|
lines[ numLines ] = composite_kernel_start;
|
|
lines[ 2*numLines + 1] = composite_kernel_end;
|
|
|
|
/* Fill the rest with templated kernels */
|
|
for(i = numLines + 1; i < 2*numLines + 1; i++ )
|
|
{
|
|
sprintf(buffer, composite_kernel_template, i - numLines - 1);
|
|
lines[ i ] = _strdup(buffer);
|
|
}
|
|
|
|
/* Try to create a program with these lines */
|
|
error = create_single_kernel_helper_create_program(context, &my_program_and_libraries[0], 2 * numLines + 2, lines);
|
|
if( my_program_and_libraries[0] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(my_program_and_libraries[0], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
/* Create and compile templated kernels */
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, simple_kernel_template, i);
|
|
const char* kernel_source = _strdup(buffer);
|
|
error = create_single_kernel_helper_create_program(context, &simple_kernels[i], 1, &kernel_source);
|
|
if( simple_kernels[i] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(simple_kernels[i], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
free((void*)kernel_source);
|
|
}
|
|
|
|
/* Create library out of compiled templated kernels */
|
|
for(i = 0; i < numLibraries; i++) {
|
|
my_program_and_libraries[i+1] = clLinkProgram(context, 1, &deviceID, "-create-library", numFilesInLib, simple_kernels+i*numFilesInLib, NULL, NULL, &error);
|
|
test_error( error, "Unable to create a multi-line library" );
|
|
}
|
|
|
|
/* Link the program that calls the kernels and the library that contains them */
|
|
cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, numLibraries+1, my_program_and_libraries, NULL, NULL, &error);
|
|
test_error( error, "Unable to link a program with a library" );
|
|
|
|
// Create the composite kernel
|
|
cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CompositeKernel", &error);
|
|
test_error( error, "Unable to create a composite kernel" );
|
|
|
|
// Run the composite kernel and verify the results
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
for(i = 0; i <= numLibraries; i++) {
|
|
error = clReleaseProgram( my_program_and_libraries[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
free( my_program_and_libraries );
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
free( (void*)lines[i] );
|
|
}
|
|
for(i = numLines + 1; i < 2*numLines + 1; i++ )
|
|
{
|
|
free( (void*)lines[i] );
|
|
}
|
|
free( lines );
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
error = clReleaseProgram( simple_kernels[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
free( simple_kernels );
|
|
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseProgram( my_newly_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Runs test_large_multiple_libraries() for each entry of a zero-terminated
 * list of kernel counts and logs how long each run took (clock() on Windows,
 * gettimeofday() on Linux/macOS, no timing elsewhere).
 *
 * Returns 0 when every count succeeds and -1 as soon as one fails.
 * num_elements is not used by this function.
 */
int test_multiple_libraries(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    /* Kernel counts to try; the trailing 0 ends the list */
    unsigned int kernelCounts[] = { 2, 8, 32, 128, 256, 0 };
    unsigned int idx = 0;

    log_info( "Testing multiple libraries ...this might take awhile...\n" );

    while( kernelCounts[ idx ] != 0 )
    {
        const unsigned int kernelCount = kernelCounts[ idx ];

        log_info( " %d...\n", kernelCount );

#if defined(_WIN32)
        clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        timeval before, after;
        gettimeofday(&before, NULL);
#endif

        if( test_large_multiple_libraries( context, deviceID, queue, kernelCount ) != 0 )
        {
            log_error( "ERROR: multiple library program test failed for %d lines! (in %s:%d)\n\n", kernelCount, __FILE__, __LINE__ );
            return -1;
        }

#if defined(_WIN32)
        clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", kernelCount );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&after, NULL);
        log_perf( (float)(after.tv_sec - before.tv_sec) + 1.0e-6 * (after.tv_usec - before.tv_usec), false, "wall time in secs", "%d lines", kernelCount );
#endif

        ++idx;
    }

    return 0;
}
|
|
|
|
int test_large_multiple_files_multiple_libraries(cl_context context, cl_device_id deviceID, cl_command_queue queue, unsigned int numLines)
|
|
{
|
|
int error;
|
|
cl_program *simple_kernels;
|
|
const char **lines;
|
|
unsigned int i;
|
|
char buffer[MAX_LINE_SIZE_IN_PROGRAM];
|
|
/* I want to create (log2(N)+1)/4 libraries */
|
|
unsigned int level = (unsigned int)(logbase(numLines, 2.0) + 1.000001)/2;
|
|
unsigned int numLibraries = (unsigned int)pow(2.0, level - 2.0);
|
|
unsigned int numFilesInLib = numLines/(2*numLibraries);
|
|
cl_program *my_programs_and_libraries = (cl_program*)malloc((1+numLibraries+numLibraries*numFilesInLib)*sizeof(cl_program));
|
|
if (my_programs_and_libraries == NULL) {
|
|
log_error( "ERROR: Unable to allocate program array with %d programs! (in %s:%d)\n", (1+numLibraries+numLibraries*numFilesInLib), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
log_info("level - %d, numLibraries - %d, numFilesInLib - %d\n", level, numLibraries, numFilesInLib);
|
|
|
|
simple_kernels = (cl_program*)malloc(numLines*sizeof(cl_program));
|
|
if (simple_kernels == NULL) {
|
|
log_error( "ERROR: Unable to allocate kernels array with %d kernels! (in %s:%d)\n", numLines, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
/* First, allocate the array for our line pointers */
|
|
lines = (const char **)malloc( (2*numLines + 2) * sizeof( const char * ) );
|
|
if (lines == NULL) {
|
|
log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", (2*numLines + 2), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, composite_kernel_extern_template, i);
|
|
lines[i] = _strdup(buffer);
|
|
}
|
|
/* First and last lines are easy */
|
|
lines[ numLines ] = composite_kernel_start;
|
|
lines[ 2*numLines + 1] = composite_kernel_end;
|
|
|
|
/* Fill the rest with templated kernels */
|
|
for(i = numLines + 1; i < 2*numLines + 1; i++ )
|
|
{
|
|
sprintf(buffer, composite_kernel_template, i - numLines - 1);
|
|
lines[ i ] = _strdup(buffer);
|
|
}
|
|
|
|
/* Try to create a program with these lines */
|
|
error = create_single_kernel_helper_create_program(context, &my_programs_and_libraries[0], 2 * numLines + 2, lines);
|
|
if( my_programs_and_libraries[0] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(my_programs_and_libraries[0], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
/* Create and compile templated kernels */
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, simple_kernel_template, i);
|
|
const char* kernel_source = _strdup(buffer);
|
|
error = create_single_kernel_helper_create_program(context, &simple_kernels[i], 1, &kernel_source);
|
|
if( simple_kernels[i] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(simple_kernels[i], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
free((void*)kernel_source);
|
|
}
|
|
|
|
/* Copy already compiled kernels */
|
|
for( i = 0; i < numLibraries*numFilesInLib; i++) {
|
|
my_programs_and_libraries[i+1] = simple_kernels[i];
|
|
}
|
|
|
|
/* Create library out of compiled templated kernels */
|
|
for( i = 0; i < numLibraries; i++) {
|
|
my_programs_and_libraries[i+1+numLibraries*numFilesInLib] = clLinkProgram(context, 1, &deviceID, "-create-library", numFilesInLib, simple_kernels+(i*numFilesInLib+numLibraries*numFilesInLib), NULL, NULL, &error);
|
|
test_error( error, "Unable to create a multi-line library" );
|
|
}
|
|
|
|
/* Link the program that calls the kernels and the library that contains them */
|
|
cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, numLibraries+1+numLibraries*numFilesInLib, my_programs_and_libraries, NULL, NULL, &error);
|
|
test_error( error, "Unable to link a program with a library" );
|
|
|
|
// Create the composite kernel
|
|
cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CompositeKernel", &error);
|
|
test_error( error, "Unable to create a composite kernel" );
|
|
|
|
// Run the composite kernel and verify the results
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
for(i = 0; i < numLibraries+1+numLibraries*numFilesInLib; i++) {
|
|
error = clReleaseProgram( my_programs_and_libraries[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
free( my_programs_and_libraries );
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
free( (void*)lines[i] );
|
|
}
|
|
for(i = numLines + 1; i < 2*numLines + 1; i++ )
|
|
{
|
|
free( (void*)lines[i] );
|
|
}
|
|
free( lines );
|
|
|
|
for(i = numLibraries*numFilesInLib; i < numLines; i++)
|
|
{
|
|
error = clReleaseProgram( simple_kernels[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
free( simple_kernels );
|
|
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseProgram( my_newly_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Drives test_large_multiple_files_multiple_libraries() over a fixed list of
 * program sizes and logs the time each size took.
 *
 * deviceID / context / queue are forwarded to the worker; num_elements is
 * not used by this function.
 *
 * Returns 0 when every size passes, -1 as soon as one size fails.
 */
int test_multiple_files_multiple_libraries(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    // Zero-terminated list of sizes to run; the larger sizes
    // (512, 2048, 8192, 32768) are currently disabled.
    unsigned int toTest[] = { 8, 32, 128, 256, 0 };

    log_info( "Testing multiple files and multiple libraries ...this might take awhile...\n" );

    for( const unsigned int *size = toTest; *size != 0; ++size )
    {
        log_info( " %d...\n", *size );

        // Start the timer (CPU clock on Windows, wall clock on Linux/macOS).
#if defined(_WIN32)
        const clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        timeval time1, time2;
        gettimeofday(&time1, NULL);
#endif

        const int status = test_large_multiple_files_multiple_libraries( context, deviceID, queue, *size );
        if( status != 0 )
        {
            log_error( "ERROR: multiple files, multiple libraries program test failed for %d lines! (in %s:%d)\n\n", *size, __FILE__, __LINE__ );
            return -1;
        }

        // Stop the timer and report the elapsed seconds.
#if defined(_WIN32)
        const clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", *size );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&time2, NULL);
        log_perf( (float)(time2.tv_sec - time1.tv_sec) + 1.0e-6 * (time2.tv_usec - time1.tv_usec), false, "wall time in secs", "%d lines", *size );
#endif
    }

    return 0;
}
|
|
|
|
/*
 * Compiles one "composite" program plus numLines small generated programs,
 * links all of them into a single executable, creates the "CompositeKernel"
 * kernel from it and checks it with verifyCopyBuffer().
 *
 * The composite source consists of numLines lines generated from
 * composite_kernel_extern_template, then composite_kernel_start, then
 * numLines lines generated from composite_kernel_template, then
 * composite_kernel_end. Each small program is generated from
 * simple_kernel_template with its index.
 *
 * Returns 0 on success, -1 on an allocation or program-creation failure, or
 * the failing error code from verifyCopyBuffer().
 *
 * NOTE(review): test_error() appears to return from this function on
 * failure; those paths (and a verifyCopyBuffer() failure) still exit without
 * releasing the objects created so far.
 */
int test_large_multiple_files(cl_context context, cl_device_id deviceID, cl_command_queue queue, unsigned int numLines)
{
    int error;
    const char **lines;
    unsigned int i;
    char buffer[MAX_LINE_SIZE_IN_PROGRAM];

    /* Slot 0 holds the composite program, slots 1..numLines the generated ones */
    cl_program *my_programs = (cl_program*)malloc((1+numLines)*sizeof(cl_program));
    if (my_programs == NULL) {
        log_error( "ERROR: Unable to allocate my_programs array with %d programs! (in %s:%d)\n", (1+numLines), __FILE__, __LINE__);
        return -1;
    }

    /* First, allocate the array for our line pointers */
    lines = (const char **)malloc( (2*numLines + 2) * sizeof( const char * ) );
    if (lines == NULL) {
        log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", (2*numLines + 2), __FILE__, __LINE__);
        free( my_programs ); /* do not leak the program array on this path */
        return -1;
    }

    /* Generated lines that precede composite_kernel_start */
    for( i = 0; i < numLines; i++ )
    {
        snprintf(buffer, sizeof(buffer), composite_kernel_extern_template, i);
        lines[i] = _strdup(buffer);
    }

    /* First and last lines are easy */
    lines[ numLines ] = composite_kernel_start;
    lines[ 2*numLines + 1 ] = composite_kernel_end;

    /* Fill the rest with templated kernels */
    for( i = numLines + 1; i < 2*numLines + 1; i++ )
    {
        snprintf(buffer, sizeof(buffer), composite_kernel_template, i - numLines - 1);
        lines[ i ] = _strdup(buffer);
    }

    /* Try to create a program with these lines */
    error = create_single_kernel_helper_create_program(context, &my_programs[0], 2 * numLines + 2, lines);
    if( error != CL_SUCCESS || my_programs[0] == NULL )
    {
        log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    /* Compile it */
    error = clCompileProgram(my_programs[0], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    /* Create and compile templated kernels */
    for( i = 0; i < numLines; i++ )
    {
        snprintf(buffer, sizeof(buffer), simple_kernel_template, i);

        /* The source is only needed until this program has been compiled,
           and buffer is not rewritten before then, so no heap copy (and no
           copy to leak on the early exits below) is required. */
        const char* kernel_source = buffer;

        error = create_single_kernel_helper_create_program(context, &my_programs[i + 1], 1, &kernel_source);
        if( error != CL_SUCCESS || my_programs[i+1] == NULL )
        {
            log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
            return -1;
        }

        /* Compile it */
        error = clCompileProgram(my_programs[i+1], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
        test_error( error, "Unable to compile a simple program" );
    }

    /* Link the program that calls the kernels and the library that contains them */
    cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 1+numLines, my_programs, NULL, NULL, &error);
    test_error( error, "Unable to link a program with a library" );

    // Create the composite kernel
    cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CompositeKernel", &error);
    test_error( error, "Unable to create a composite kernel" );

    // Run the composite kernel and verify the results
    error = verifyCopyBuffer(context, queue, kernel);
    if (error != CL_SUCCESS)
        return error;

    /* All done! */
    for( i = 0; i < 1+numLines; i++ ) {
        error = clReleaseProgram( my_programs[i] );
        test_error( error, "Unable to release program object" );
    }
    free( my_programs );

    /* Only the generated lines are heap copies; entries numLines and
       2*numLines+1 point at the shared start/end strings. */
    for( i = 0; i < numLines; i++ )
    {
        free( (void*)lines[i] );
    }
    for( i = numLines + 1; i < 2*numLines + 1; i++ )
    {
        free( (void*)lines[i] );
    }
    free( lines );

    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseProgram( my_newly_linked_program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Drives test_large_multiple_files() over a fixed list of program sizes and
 * logs the time each size took.
 *
 * deviceID / context / queue are forwarded to the worker; num_elements is
 * not used by this function.
 *
 * Returns 0 when every size passes, -1 as soon as one size fails.
 */
int test_multiple_files(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    // Zero-terminated list of sizes to run; the larger sizes
    // (512, 2048, 8192, 32768) are currently disabled.
    unsigned int toTest[] = { 8, 32, 128, 256, 0 };

    log_info( "Testing multiple files compilation and linking into a single executable ...this might take awhile...\n" );

    for( const unsigned int *size = toTest; *size != 0; ++size )
    {
        log_info( " %d...\n", *size );

        // Start the timer (CPU clock on Windows, wall clock on Linux/macOS).
#if defined(_WIN32)
        const clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        timeval time1, time2;
        gettimeofday(&time1, NULL);
#endif

        const int status = test_large_multiple_files( context, deviceID, queue, *size );
        if( status != 0 )
        {
            log_error( "ERROR: multiple files program test failed for %d lines! (in %s:%d)\n\n", *size, __FILE__, __LINE__ );
            return -1;
        }

        // Stop the timer and report the elapsed seconds.
#if defined(_WIN32)
        const clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", *size );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&time2, NULL);
        log_perf( (float)(time2.tv_sec - time1.tv_sec) + 1.0e-6 * (time2.tv_usec - time1.tv_usec), false, "wall time in secs", "%d lines", *size );
#endif
    }

    return 0;
}
|
|
|
|
/*
 * Creates a program from simple_kernel, compiles it (without linking) for
 * deviceID and releases it.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if the program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_compile_only(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    cl_program program;
    int error;

    log_info("Testing a simple compilation only...\n");

    // Create the program object from the single source string.
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // Compile only: no headers, no options, no callback.
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // Clean up.
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compile-only test for three sources in turn: compile_static_var,
 * compile_static_struct and compile_static_function. Each one is created,
 * compiled for deviceID and released before the next one starts.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if a program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_static_compile_only(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;

    log_info("Testing a simple static compilations only...\n");

    /* --- static variable --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &compile_static_var);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple static variable test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling a static variable...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple static variable program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    /* --- static struct --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &compile_static_struct);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple static struct test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling a static struct...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    /* Message names the struct case so a failure is attributed to the right step */
    test_error( error, "Unable to compile a simple static struct program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    /* --- static function --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &compile_static_function);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple static function test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling a static function...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple static function program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compile-only test for four sources in turn: simple_header (logged as the
 * "extern kernel" case), compile_extern_var, compile_extern_struct and
 * compile_extern_function. Each one is created, compiled for deviceID and
 * released before the next one starts.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if a program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_extern_compile_only(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;

    log_info("Testing a simple extern compilations only...\n");

    /* --- extern kernel --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_header);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple extern kernel test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling an extern kernel...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple extern kernel program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    /* --- extern variable --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &compile_extern_var);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple extern variable test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling an extern variable...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple extern variable program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    /* --- extern struct --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &compile_extern_struct);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple extern struct test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling an extern struct...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    /* Message names the struct case so a failure is attributed to the right step */
    test_error( error, "Unable to compile a simple extern struct program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    /* --- extern function --- */
    error = create_single_kernel_helper_create_program(context, &program, 1, &compile_extern_function);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple extern function test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    log_info("Compiling an extern function...\n");
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple extern function program" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
struct simple_user_data {
|
|
const char* m_message;
|
|
cl_event m_event;
|
|
};
|
|
|
|
// Message passed through simple_user_data to simple_compile_callback, which compares it with strcmp().
const char* once_upon_a_midnight_dreary = "Once upon a midnight dreary!";
|
|
|
|
/*
 * Completion callback handed to clCompileProgram().
 *
 * user_data must point at a simple_user_data. The callback logs the message
 * it received, logs an error if that message differs from
 * once_upon_a_midnight_dreary, and then sets the carried user event to
 * CL_COMPLETE. If the event status cannot be set the process exits with -1.
 */
static void CL_CALLBACK simple_compile_callback(cl_program program, void* user_data)
{
    simple_user_data* payload = (simple_user_data*)user_data;
    const char* received = payload->m_message;

    log_info("in the simple_compile_callback: program %p just completed compiling with '%s'\n", program, received);

    // A mismatch is only reported; the event is still signaled below.
    const bool message_matches = ( strcmp(once_upon_a_midnight_dreary, received) == 0 );
    if (!message_matches)
    {
        log_error("ERROR: in the simple_compile_callback: Expected '%s' and got %s (in %s:%d)!\n", once_upon_a_midnight_dreary, received, __FILE__, __LINE__);
    }

    log_info("in the simple_compile_callback: program %p just completed compiling with '%p'\n", program, payload->m_event);

    // Signal the user event carried in the payload.
    const int status = clSetUserEventStatus(payload->m_event, CL_COMPLETE);
    if (status != CL_SUCCESS)
    {
        log_error( "ERROR: in the simple_compile_callback: Unable to set user event status to CL_COMPLETE! (%s in %s:%d)\n", IGetErrorString( status ), __FILE__, __LINE__ );
        exit(-1);
    }

    log_info("in the simple_compile_callback: Successfully signaled compile_program_completion_event!\n");
}
|
|
|
|
/*
 * Compiles simple_kernel with simple_compile_callback registered as the
 * completion callback, then waits on a user event that the callback is
 * expected to set to CL_COMPLETE.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if the program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_compile_with_callback(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    cl_program program;
    int error;

    log_info("Testing a simple compilation with callback...\n");

    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // User event that the callback signals once compilation has completed.
    cl_event compile_program_completion_event = clCreateUserEvent(context, &error);
    test_error( error, "Unable to create a user event");

    // Payload for the callback: the expected message plus the event to signal.
    simple_user_data callback_data;
    callback_data.m_message = once_upon_a_midnight_dreary;
    callback_data.m_event = compile_program_completion_event;

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, simple_compile_callback, &callback_data);
    test_error( error, "Unable to compile a simple program with a callback" );

    // Wait until the callback has signaled the event.
    error = clWaitForEvents(1, &compile_program_completion_event);
    test_error( error, "clWaitForEvents failed when waiting on compile_program_completion_event");

    // Clean up.
    error = clReleaseEvent(compile_program_completion_event);
    test_error( error, "Unable to release event object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compiles another_simple_kernel_with_header with simple_header supplied as
 * an embedded header program under the name simple_header_name, then
 * releases both program objects.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if either program object cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_embedded_header_compile(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;

    log_info("Testing a simple embedded header compile only...\n");

    // Program that uses the header.
    cl_program program = clCreateProgramWithSource(context, 1, &another_simple_kernel_with_header, NULL, &error);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // The header itself, wrapped in its own program object.
    cl_program header = clCreateProgramWithSource(context, 1, &simple_header, NULL, &error);
    if( error != CL_SUCCESS || header == NULL )
    {
        log_error( "ERROR: Unable to create a simple header program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // Compile with exactly one embedded header.
    error = clCompileProgram(program, 1, &deviceID, NULL, 1, &header, &simple_header_name, NULL, NULL);
    test_error( error, "Unable to compile a simple program with embedded header" );

    // Clean up.
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( header );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Creates and compiles simple_kernel, links the compiled program on its own
 * into a new program object, and releases both.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if the program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_link_only(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    cl_program program;
    int error;

    log_info("Testing a simple linking only...\n");

    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // Step 1: compile.
    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // Step 2: link the single compiled program with no options.
    cl_program linked = clLinkProgram(context, 1, &deviceID, NULL, 1, &program, NULL, NULL, &error);
    test_error( error, "Unable to link a simple program" );

    // Clean up.
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( linked );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compiles two program objects and links them together: the first is built
 * from simple_kernel plus compile_regular_var, the second from
 * link_static_var_access. The link is expected to succeed.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if either program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_two_file_regular_variable_access(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program, second_program, my_newly_linked_program;

    const char* sources[2] = {simple_kernel, compile_regular_var}; // here we want to avoid linking error due to lack of kernels
    log_info("Compiling and linking two program objects, where one tries to access regular variable from another...\n");

    error = create_single_kernel_helper_create_program(context, &program, 2, sources);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a test program with regular variable! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    /* Message names the variable case (it previously said "regular function") */
    test_error( error, "Unable to compile a simple program with regular variable" );

    error = create_single_kernel_helper_create_program(context, &second_program, 1, &link_static_var_access);
    /* Validate the program that was just created, not the first one */
    if( second_program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a test program that tries to access a regular variable! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(second_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a program that tries to access a regular variable" );

    cl_program two_programs[2] = { program, second_program };
    my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 2, two_programs, NULL, NULL, &error);
    test_error( error, "clLinkProgram: Expected a different error code while linking a program that tries to access a regular variable" );

    /* All done! */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( second_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_linked_program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compiles two program objects and links them together: the first is built
 * from simple_kernel plus compile_regular_struct, the second from
 * link_static_struct_access. The link is expected to succeed.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if either program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_two_file_regular_struct_access(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;
    cl_program second_program;

    // simple_kernel is included so the link does not fail for lack of kernels.
    const char* sources[2] = { simple_kernel, compile_regular_struct };

    log_info("Compiling and linking two program objects, where one tries to access regular struct from another...\n");

    // First program: defines the struct.
    error = create_single_kernel_helper_create_program(context, &program, 2, sources);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a test program with regular struct! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program with regular struct" );

    // Second program: accesses the struct.
    error = create_single_kernel_helper_create_program(context, &second_program, 1, &link_static_struct_access);
    if( error != CL_SUCCESS || second_program == NULL )
    {
        log_error( "ERROR: Unable to create a test program that tries to access a regular struct! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(second_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a program that tries to access a regular struct" );

    // Link both compiled programs.
    cl_program link_inputs[2] = { program, second_program };
    cl_program linked = clLinkProgram(context, 1, &deviceID, NULL, 2, link_inputs, NULL, NULL, &error);
    test_error( error, "clLinkProgram: Expected a different error code while linking a program that tries to access a regular struct" );

    // Clean up.
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( second_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( linked );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
|
|
/*
 * Compiles two program objects and links them together: the first is built
 * from simple_kernel plus compile_regular_function, the second from
 * link_static_function_access. The link is expected to succeed.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if either program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_two_file_regular_function_access(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;
    cl_program second_program;

    // simple_kernel is included so the link does not fail for lack of kernels.
    const char* sources[2] = { simple_kernel, compile_regular_function };

    log_info("Compiling and linking two program objects, where one tries to access regular function from another...\n");

    // First program: defines the function.
    error = create_single_kernel_helper_create_program(context, &program, 2, sources);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a test program with regular function! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program with regular function" );

    // Second program: accesses the function.
    error = create_single_kernel_helper_create_program(context, &second_program, 1, &link_static_function_access);
    if( error != CL_SUCCESS || second_program == NULL )
    {
        log_error( "ERROR: Unable to create a test program that tries to access a regular function! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(second_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a program that tries to access a regular function" );

    // Link both compiled programs.
    cl_program link_inputs[2] = { program, second_program };
    cl_program linked = clLinkProgram(context, 1, &deviceID, NULL, 2, link_inputs, NULL, NULL, &error);
    test_error( error, "clLinkProgram: Expected a different error code while linking a program that tries to access a regular function" );

    // Clean up.
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( second_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( linked );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compiles another_simple_kernel_with_header against an embedded header
 * (simple_header under the name simple_header_name), compiles simple_kernel
 * separately, and links the two compiled programs into one executable.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if a program object cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_embedded_header_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;

    log_info("Testing a simple embedded header link...\n");

    // Program that uses the header.
    cl_program program = clCreateProgramWithSource(context, 1, &another_simple_kernel_with_header, NULL, &error);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // The header itself, wrapped in its own program object.
    cl_program header = clCreateProgramWithSource(context, 1, &simple_header, NULL, &error);
    if( error != CL_SUCCESS || header == NULL )
    {
        log_error( "ERROR: Unable to create a simple header program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 1, &header, &simple_header_name, NULL, NULL);
    test_error( error, "Unable to compile a simple program with embedded header" );

    // Second, header-free program.
    cl_program simple_program;
    error = create_single_kernel_helper_create_program(context, &simple_program, 1, &simple_kernel);
    if( error != CL_SUCCESS || simple_program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(simple_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // Link both compiled programs, passing an empty options string.
    cl_program link_inputs[2] = { program, simple_program };
    cl_program fully_linked_program = clLinkProgram(context, 1, &deviceID, "", 2, link_inputs, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from two binaries, one compiled with embedded header" );

    // Clean up.
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( header );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( simple_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( fully_linked_program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
// Message passed through simple_user_data to simple_link_callback, which compares it with strcmp().
const char* when_i_pondered_weak_and_weary = "When I pondered weak and weary!";
|
|
|
|
/*
 * Completion callback handed to clLinkProgram().
 *
 * user_data must point at a simple_user_data. The callback logs the message
 * it received, logs an error if that message differs from
 * when_i_pondered_weak_and_weary, and then sets the carried user event to
 * CL_COMPLETE. If the event status cannot be set the process exits with -1.
 */
static void CL_CALLBACK simple_link_callback(cl_program program, void* user_data)
{
    simple_user_data* simple_link_user_data = (simple_user_data*)user_data;
    log_info("in the simple_link_callback: program %p just completed linking with '%s'\n", program, (const char*)simple_link_user_data->m_message);

    /* A mismatch is only reported; the event is still signaled below */
    if (strcmp(when_i_pondered_weak_and_weary, simple_link_user_data->m_message) != 0)
    {
        /* The message names this callback (it previously named simple_compile_callback) */
        log_error("ERROR: in the simple_link_callback: Expected '%s' and got %s! (in %s:%d)\n", when_i_pondered_weak_and_weary, simple_link_user_data->m_message, __FILE__, __LINE__);
    }

    int error;
    log_info("in the simple_link_callback: program %p just completed linking with '%p'\n", program, simple_link_user_data->m_event);

    /* Signal the user event carried in the payload */
    error = clSetUserEventStatus(simple_link_user_data->m_event, CL_COMPLETE);
    if (error != CL_SUCCESS)
    {
        log_error( "ERROR: simple_link_callback: Unable to set user event status to CL_COMPLETE! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        exit(-1);
    }
    log_info("in the simple_link_callback: Successfully signaled link_program_completion_event event!\n");
}
|
|
|
|
/*
 * Compiles simple_kernel, then links it with simple_link_callback registered
 * as the completion callback and waits on a user event that the callback is
 * expected to set to CL_COMPLETE.
 *
 * queue and num_elements are not used by this function.
 *
 * Returns 0 on success and -1 if the program cannot be created.
 * NOTE(review): test_error() appears to return on failure - confirm against
 * the harness.
 */
int test_simple_link_with_callback(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    cl_program program;
    int error;

    log_info("Testing a simple linking with callback...\n");

    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( error != CL_SUCCESS || program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // User event that the callback signals once linking has completed.
    cl_event link_program_completion_event = clCreateUserEvent(context, &error);
    test_error( error, "Unable to create a user event");

    // Payload for the callback: the expected message plus the event to signal.
    simple_user_data callback_data;
    callback_data.m_message = when_i_pondered_weak_and_weary;
    callback_data.m_event = link_program_completion_event;

    cl_program my_linked_library = clLinkProgram(context, 1, &deviceID, NULL, 1, &program, simple_link_callback, &callback_data, &error);
    test_error( error, "Unable to link a simple program" );

    // Wait until the callback has signaled the event.
    error = clWaitForEvents(1, &link_program_completion_event);
    test_error( error, "clWaitForEvents failed when waiting on link_program_completion_event");

    // Clean up.
    error = clReleaseEvent(link_program_completion_event);
    test_error( error, "Unable to release event object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_linked_library );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
// Fills the first cnDimension entries of srcBuffer with the repeating ramp
// 0, 1, ..., 9, 0, 1, ... (element i receives the value i modulo 10).
//
// srcBuffer   - destination array; must hold at least cnDimension floats
// cnDimension - number of elements to write
static void initBuffer(float* & srcBuffer, unsigned int cnDimension)
{
    unsigned int idx = 0;

    while( idx < cnDimension )
    {
        // Values 0..9 are exactly representable, so this matches a running
        // float counter that is reset every tenth element.
        srcBuffer[ idx ] = (float)( idx % 10 );
        ++idx;
    }
}
|
|
|
|
static int verifyCopyBuffer(cl_context context, cl_command_queue queue, cl_kernel kernel)
|
|
{
|
|
int error, result = CL_SUCCESS;
|
|
const size_t cnDimension = 32;
|
|
|
|
// Allocate source buffer
|
|
float * srcBuffer = (float*)malloc(cnDimension * sizeof(float));
|
|
float * dstBuffer = (float*)malloc(cnDimension * sizeof(float));
|
|
|
|
if (srcBuffer == NULL) {
|
|
log_error( "ERROR: Unable to allocate srcBuffer float array with %lu floats! (in %s:%d)\n", cnDimension, __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
if (dstBuffer == NULL) {
|
|
log_error( "ERROR: Unable to allocate dstBuffer float array with %lu floats! (in %s:%d)\n", cnDimension, __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
|
|
if( srcBuffer && dstBuffer )
|
|
{
|
|
// initialize host memory
|
|
initBuffer(srcBuffer, cnDimension );
|
|
|
|
// Allocate device memory
|
|
cl_mem deviceMemSrc = clCreateBuffer(context, CL_MEM_READ_ONLY | CL_MEM_COPY_HOST_PTR,
|
|
cnDimension * sizeof( cl_float ), srcBuffer, &error);
|
|
test_error( error, "Unable to create a source memory buffer" );
|
|
|
|
cl_mem deviceMemDst = clCreateBuffer(context, CL_MEM_WRITE_ONLY,
|
|
cnDimension * sizeof( cl_float ), 0, &error);
|
|
test_error( error, "Unable to create a destination memory buffer" );
|
|
|
|
// Set kernel args
|
|
// Set parameter 0 to be the source buffer
|
|
error = clSetKernelArg(kernel, 0, sizeof( cl_mem ), ( void * )&deviceMemSrc );
|
|
test_error( error, "Unable to set the first kernel argument" );
|
|
|
|
// Set parameter 1 to be the destination buffer
|
|
error = clSetKernelArg(kernel, 1, sizeof( cl_mem ), ( void * )&deviceMemDst );
|
|
test_error( error, "Unable to set the second kernel argument" );
|
|
|
|
// Execute kernel
|
|
error = clEnqueueNDRangeKernel(queue, kernel, 1, NULL,
|
|
&cnDimension, 0, 0, NULL, NULL );
|
|
test_error( error, "Unable to enqueue kernel" );
|
|
|
|
error = clFlush( queue );
|
|
test_error( error, "Unable to flush the queue" );
|
|
|
|
// copy results from device back to host
|
|
error = clEnqueueReadBuffer(queue, deviceMemDst, CL_TRUE, 0, cnDimension * sizeof( cl_float ),
|
|
dstBuffer, 0, NULL, NULL );
|
|
test_error( error, "Unable to read the destination buffer" );
|
|
|
|
error = clFlush( queue );
|
|
test_error( error, "Unable to flush the queue" );
|
|
|
|
// Compare the source and destination buffers
|
|
const int* pSrc = (int*)srcBuffer;
|
|
const int* pDst = (int*)dstBuffer;
|
|
int mismatch = 0;
|
|
|
|
for( size_t i = 0; i < cnDimension; i++ )
|
|
{
|
|
if( pSrc[i] != pDst[i] )
|
|
{
|
|
if( mismatch < 4 )
|
|
{
|
|
log_info("Offset %08lX: Expected %08X, Got %08X\n", i * 4, pSrc[i], pDst[i] );
|
|
}
|
|
else
|
|
{
|
|
log_info(".");
|
|
}
|
|
mismatch++;
|
|
}
|
|
}
|
|
|
|
if( mismatch )
|
|
{
|
|
log_info("*** %d mismatches found, TEST FAILS! ***\n", mismatch );
|
|
result = -1;
|
|
}
|
|
else
|
|
{
|
|
log_info("Buffers match, test passes.\n");
|
|
}
|
|
|
|
free( srcBuffer );
|
|
srcBuffer = NULL;
|
|
free( dstBuffer );
|
|
dstBuffer = NULL;
|
|
|
|
if( deviceMemSrc )
|
|
{
|
|
error = clReleaseMemObject( deviceMemSrc );
|
|
test_error( error, "Unable to release memory object" );
|
|
}
|
|
|
|
if( deviceMemDst )
|
|
{
|
|
error = clReleaseMemObject( deviceMemDst );
|
|
test_error( error, "Unable to release memory object" );
|
|
}
|
|
}
|
|
return result;
|
|
}
|
|
|
|
// Compiles simple_kernel, links it into an executable and runs the resulting
// "CopyBuffer" kernel through verifyCopyBuffer.
//
// deviceID     - device to compile and link for
// context      - context owning the programs
// queue        - queue the kernel is executed on
// num_elements - unused by this test
//
// Returns 0 on success, -1 when the source program cannot be created, the
// verifyCopyBuffer result when verification fails; other failures leave
// through test_error.
int test_execute_after_simple_compile_and_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;

    log_info("Testing execution after a simple compile and link...\n");
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 1, &program, NULL, NULL, &error);
    test_error( error, "Unable to link a simple program" );

    cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    // Remember the verdict instead of returning immediately, so the kernel and
    // both programs are released even when verification fails.
    int result = verifyCopyBuffer(context, queue, kernel);

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_linked_program );
    test_error( error, "Unable to release program object" );

    return result;
}
|
|
|
|
// Same flow as the plain compile-and-link execution test, but both
// clCompileProgram and clLinkProgram are called with an empty device list
// (num_devices = 0, device_list = NULL).
//
// deviceID     - unused for compiling/linking here (no device list is passed)
// context      - context owning the programs
// queue        - queue the kernel is executed on
// num_elements - unused by this test
//
// Returns 0 on success, -1 when the source program cannot be created, the
// verifyCopyBuffer result when verification fails; other failures leave
// through test_error.
int test_execute_after_simple_compile_and_link_no_device_info(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;

    log_info("Testing execution after a simple compile and link with no device information provided...\n");
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // No device list: the implementation picks the devices itself.
    error = clCompileProgram(program, 0, NULL, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program my_newly_linked_program = clLinkProgram(context, 0, NULL, NULL, 1, &program, NULL, NULL, &error);
    test_error( error, "Unable to link a simple program" );

    cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    // Remember the verdict instead of returning immediately, so the kernel and
    // both programs are released even when verification fails.
    int result = verifyCopyBuffer(context, queue, kernel);

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_linked_program );
    test_error( error, "Unable to release program object" );

    return result;
}
|
|
|
|
// Compiles simple_kernel_with_defines with "-DFIRST=5 -DSECOND=37", links the
// object and runs the resulting "CopyBuffer" kernel through verifyCopyBuffer.
//
// deviceID     - device to compile and link for
// context      - context owning the programs
// queue        - queue the kernel is executed on
// num_elements - unused by this test
//
// Returns 0 on success, -1 when the source program cannot be created, the
// verifyCopyBuffer result when verification fails; other failures leave
// through test_error.
int test_execute_after_simple_compile_and_link_with_defines(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;

    log_info("Testing execution after a simple compile and link with defines...\n");
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel_with_defines, "-DFIRST=5 -DSECOND=37");
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // The same preprocessor definitions are passed again at compile time.
    error = clCompileProgram(program, 1, &deviceID, "-DFIRST=5 -DSECOND=37", 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 1, &program, NULL, NULL, &error);
    test_error( error, "Unable to link a simple program" );

    cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    // Remember the verdict instead of returning immediately, so the kernel and
    // both programs are released even when verification fails.
    int result = verifyCopyBuffer(context, queue, kernel);

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_linked_program );
    test_error( error, "Unable to release program object" );

    return result;
}
|
|
|
|
int test_execute_after_serialize_reload_object(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
|
|
{
|
|
int error;
|
|
cl_program program;
|
|
size_t binarySize;
|
|
unsigned char *binary;
|
|
|
|
log_info("Testing execution after serialization and reloading of the object...\n");
|
|
error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
|
|
if( program == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
// Get the size of the resulting binary (only one device)
|
|
error = clGetProgramInfo( program, CL_PROGRAM_BINARY_SIZES, sizeof( binarySize ), &binarySize, NULL );
|
|
test_error( error, "Unable to get binary size" );
|
|
|
|
// Sanity check
|
|
if( binarySize == 0 )
|
|
{
|
|
log_error( "ERROR: Binary size of program is zero (in %s:%d)\n", __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
// Create a buffer and get the actual binary
|
|
binary = (unsigned char*)malloc(sizeof(unsigned char)*binarySize);
|
|
if (binary == NULL) {
|
|
log_error( "ERROR: Unable to allocate binary character array with %lu characters! (in %s:%d)\n", binarySize, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
unsigned char *buffers[ 1 ] = { binary };
|
|
cl_int loadErrors[ 1 ];
|
|
|
|
// Do another sanity check here first
|
|
size_t size;
|
|
error = clGetProgramInfo( program, CL_PROGRAM_BINARIES, 0, NULL, &size );
|
|
test_error( error, "Unable to get expected size of binaries array" );
|
|
if( size != sizeof( buffers ) )
|
|
{
|
|
log_error( "ERROR: Expected size of binaries array in clGetProgramInfo is incorrect (should be %d, got %d) (in %s:%d)\n", (int)sizeof( buffers ), (int)size, __FILE__, __LINE__ );
|
|
free(binary);
|
|
return -1;
|
|
}
|
|
|
|
error = clGetProgramInfo( program, CL_PROGRAM_BINARIES, sizeof( buffers ), &buffers, NULL );
|
|
test_error( error, "Unable to get program binary" );
|
|
|
|
// use clCreateProgramWithBinary
|
|
cl_program program_with_binary = clCreateProgramWithBinary(context, 1, &deviceID, &binarySize, (const unsigned char**)buffers, loadErrors, &error);
|
|
test_error( error, "Unable to create program with binary" );
|
|
|
|
cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 1, &program_with_binary, NULL, NULL, &error);
|
|
test_error( error, "Unable to link a simple program" );
|
|
|
|
cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CopyBuffer", &error);
|
|
test_error( error, "Unable to create a simple kernel" );
|
|
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseProgram( program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( my_newly_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( program_with_binary );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
free(binary);
|
|
|
|
return 0;
|
|
}
|
|
|
|
int test_execute_after_serialize_reload_library(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
|
|
{
|
|
int error;
|
|
cl_program program, another_program;
|
|
size_t binarySize;
|
|
unsigned char *binary;
|
|
|
|
log_info("Testing execution after linking a binary with a simple library...\n");
|
|
// we will test creation of a simple library from one file
|
|
error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
|
|
if( program == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
cl_program my_newly_minted_library = clLinkProgram(context, 1, &deviceID, "-create-library", 1, &program, NULL, NULL, &error);
|
|
test_error( error, "Unable to create a simple library" );
|
|
|
|
|
|
// Get the size of the resulting library (only one device)
|
|
error = clGetProgramInfo( my_newly_minted_library, CL_PROGRAM_BINARY_SIZES, sizeof( binarySize ), &binarySize, NULL );
|
|
test_error( error, "Unable to get binary size" );
|
|
|
|
// Sanity check
|
|
if( binarySize == 0 )
|
|
{
|
|
log_error( "ERROR: Binary size of program is zero (in %s:%d)\n", __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
// Create a buffer and get the actual binary
|
|
binary = (unsigned char*)malloc(sizeof(unsigned char)*binarySize);
|
|
if (binary == NULL) {
|
|
log_error( "ERROR: Unable to allocate binary character array with %lu characters (in %s:%d)!", binarySize, __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
unsigned char *buffers[ 1 ] = { binary };
|
|
cl_int loadErrors[ 1 ];
|
|
|
|
// Do another sanity check here first
|
|
size_t size;
|
|
error = clGetProgramInfo( my_newly_minted_library, CL_PROGRAM_BINARIES, 0, NULL, &size );
|
|
test_error( error, "Unable to get expected size of binaries array" );
|
|
if( size != sizeof( buffers ) )
|
|
{
|
|
log_error( "ERROR: Expected size of binaries array in clGetProgramInfo is incorrect (should be %d, got %d) (in %s:%d)\n", (int)sizeof( buffers ), (int)size, __FILE__, __LINE__ );
|
|
free(binary);
|
|
return -1;
|
|
}
|
|
|
|
error = clGetProgramInfo( my_newly_minted_library, CL_PROGRAM_BINARIES, sizeof( buffers ), &buffers, NULL );
|
|
test_error( error, "Unable to get program binary" );
|
|
|
|
// use clCreateProgramWithBinary
|
|
cl_program library_with_binary = clCreateProgramWithBinary(context, 1, &deviceID, &binarySize, (const unsigned char**)buffers, loadErrors, &error);
|
|
test_error( error, "Unable to create program with binary" );
|
|
|
|
error = create_single_kernel_helper_create_program(context, &another_program, 1, &another_simple_kernel);
|
|
if( another_program == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
error = clCompileProgram(another_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
cl_program program_and_archive[2] = { another_program, library_with_binary };
|
|
cl_program fully_linked_program = clLinkProgram(context, 1, &deviceID, "", 2, program_and_archive, NULL, NULL, &error);
|
|
test_error( error, "Unable to create an executable from a binary and a library" );
|
|
|
|
cl_kernel kernel = clCreateKernel(fully_linked_program, "CopyBuffer", &error);
|
|
test_error( error, "Unable to create a simple kernel" );
|
|
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
cl_kernel another_kernel = clCreateKernel(fully_linked_program, "AnotherCopyBuffer", &error);
|
|
test_error( error, "Unable to create another simple kernel" );
|
|
|
|
error = verifyCopyBuffer(context, queue, another_kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseKernel( another_kernel );
|
|
test_error( error, "Unable to release another kernel object" );
|
|
|
|
error = clReleaseProgram( program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( another_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( my_newly_minted_library );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( library_with_binary );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( fully_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
free(binary);
|
|
|
|
return 0;
|
|
}
|
|
|
|
// Completion callback passed to clCompileProgram.
//
// program   - the program whose compilation finished (only logged)
// user_data - a cl_event (user event) smuggled through the void pointer; it is
//             set to CL_COMPLETE here so a thread waiting on it can continue
//
// Terminates the process with exit(-1) if the event cannot be signalled.
static void CL_CALLBACK program_compile_completion_callback(cl_program program, void* user_data)
{
    cl_event done_event = (cl_event)user_data;

    log_info("in the program_compile_completion_callback: program %p just completed compiling with '%p'\n", program, done_event);

    const int status = clSetUserEventStatus(done_event, CL_COMPLETE);
    if (status == CL_SUCCESS)
    {
        log_info("in the program_compile_completion_callback: Successfully signaled compile_program_completion_event event!\n");
        return;
    }

    // The callback has no return channel, so a failure here is fatal.
    log_error( "ERROR: in the program_compile_completion_callback: Unable to set user event status to CL_COMPLETE! (%s in %s:%d)\n", IGetErrorString( status ), __FILE__, __LINE__ );
    exit(-1);
}
|
|
|
|
// Completion callback passed to clLinkProgram.
//
// program   - the program whose linking finished (only logged)
// user_data - a cl_event (user event) smuggled through the void pointer; it is
//             set to CL_COMPLETE here so a thread waiting on it can continue
//
// Terminates the process with exit(-1) if the event cannot be signalled.
static void CL_CALLBACK program_link_completion_callback(cl_program program, void* user_data)
{
    cl_event done_event = (cl_event)user_data;

    log_info("in the program_link_completion_callback: program %p just completed linking with '%p'\n", program, done_event);

    const int status = clSetUserEventStatus(done_event, CL_COMPLETE);
    if (status == CL_SUCCESS)
    {
        log_info("in the program_link_completion_callback: Successfully signaled link_program_completion_event event!\n");
        return;
    }

    // The callback has no return channel, so a failure here is fatal.
    log_error( "ERROR: in the program_link_completion_callback: Unable to set user event status to CL_COMPLETE! (%s in %s:%d)\n", IGetErrorString( status ), __FILE__, __LINE__ );
    exit(-1);
}
|
|
|
|
// Compiles and links simple_kernel with completion callbacks on both steps,
// waiting after each step on the user event that the callback signals, then
// runs the resulting "CopyBuffer" kernel through verifyCopyBuffer.
//
// deviceID     - device to compile and link for
// context      - context owning the programs and user events
// queue        - queue the kernel is executed on
// num_elements - unused by this test
//
// Returns 0 on success, -1 when the source program cannot be created, the
// verifyCopyBuffer result when verification fails; other failures leave
// through test_error.
int test_execute_after_simple_compile_and_link_with_callbacks(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program;
    cl_event compile_program_completion_event, link_program_completion_event;

    log_info("Testing execution after a simple compile and link with callbacks...\n");
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // The user event itself is passed as the callback's user_data.
    compile_program_completion_event = clCreateUserEvent(context, &error);
    test_error( error, "Unable to create a user event");

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL,
                             program_compile_completion_callback, (void*)compile_program_completion_event);
    test_error( error, "Unable to compile a simple program" );

    error = clWaitForEvents(1, &compile_program_completion_event);
    test_error( error, "clWaitForEvents failed when waiting on compile_program_completion_event");

    error = clReleaseEvent(compile_program_completion_event);
    test_error( error, "Unable to release event object" );

    link_program_completion_event = clCreateUserEvent(context, &error);
    test_error( error, "Unable to create a user event");

    cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 1, &program,
                                                       program_link_completion_callback, (void*)link_program_completion_event, &error);
    test_error( error, "Unable to link a simple program" );

    error = clWaitForEvents(1, &link_program_completion_event);
    test_error( error, "clWaitForEvents failed when waiting on link_program_completion_event");

    error = clReleaseEvent(link_program_completion_event);
    test_error( error, "Unable to release event object" );

    cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    // Remember the verdict instead of returning immediately, so the kernel and
    // both programs are released even when verification fails.
    int result = verifyCopyBuffer(context, queue, kernel);

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_linked_program );
    test_error( error, "Unable to release program object" );

    return result;
}
|
|
|
|
// Compiles simple_kernel and links the object with "-create-library"; the
// library is created and released without being executed.
//
// deviceID     - device to compile and link for
// context      - context owning the programs
// queue        - unused by this test
// num_elements - unused by this test
//
// Returns 0 when every step succeeds and -1 when the source program cannot be
// created; any other failure leaves through test_error.
int test_simple_library_only(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program compiled_object;

    log_info("Testing creation of a simple library...\n");

    // Source -> program object
    error = create_single_kernel_helper_create_program(context, &compiled_object, 1, &simple_kernel);
    if (compiled_object == NULL || error != CL_SUCCESS)
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // Program object -> compiled object
    error = clCompileProgram(compiled_object, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // Compiled object -> library
    cl_program library = clLinkProgram(context, 1, &deviceID, "-create-library", 1, &compiled_object,
                                       NULL, NULL, &error);
    test_error( error, "Unable to create a simple library" );

    // Tear down
    error = clReleaseProgram( compiled_object );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( library );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
// Compiles simple_kernel and creates a library from it ("-create-library")
// while registering simple_link_callback, then waits on the user event that is
// handed to the callback inside a simple_user_data record.
//
// deviceID     - device to compile and link for
// context      - context owning the programs and the user event
// queue        - unused by this test
// num_elements - unused by this test
//
// Returns 0 when every step succeeds and -1 when the source program cannot be
// created; any other failure leaves through test_error.
int test_simple_library_with_callback(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program compiled_object;

    log_info("Testing creation of a simple library with a callback...\n");

    // Source -> program object
    error = create_single_kernel_helper_create_program(context, &compiled_object, 1, &simple_kernel);
    if (compiled_object == NULL || error != CL_SUCCESS)
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    // Program object -> compiled object
    error = clCompileProgram(compiled_object, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // Event this thread blocks on until the link callback has run.
    cl_event link_done = clCreateUserEvent(context, &error);
    test_error( error, "Unable to create a user event");

    simple_user_data callback_payload = {when_i_pondered_weak_and_weary, link_done};

    // Compiled object -> library, with completion callback
    cl_program library = clLinkProgram(context, 1, &deviceID, "-create-library", 1, &compiled_object,
                                       simple_link_callback, (void*)&callback_payload, &error);
    test_error( error, "Unable to create a simple library" );

    error = clWaitForEvents(1, &link_done);
    test_error( error, "clWaitForEvents failed when waiting on link_program_completion_event");

    // Tear down
    error = clReleaseEvent(link_done);
    test_error( error, "Unable to release event object" );

    error = clReleaseProgram( compiled_object );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( library );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
// Creates a library from simple_kernel, compiles another_simple_kernel, and
// links the second object against the library into one program. Nothing is
// executed; the test only checks that each step succeeds.
//
// deviceID     - device to compile and link for
// context      - context owning the programs
// queue        - unused by this test
// num_elements - unused by this test
//
// Returns 0 when every step succeeds and -1 when a source program cannot be
// created; any other failure leaves through test_error.
int test_simple_library_with_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program library_object;
    cl_program consumer_object;

    log_info("Testing creation and linking with a simple library...\n");

    // --- library side ---
    error = create_single_kernel_helper_create_program(context, &library_object, 1, &simple_kernel);
    if (library_object == NULL || error != CL_SUCCESS)
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(library_object, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program library = clLinkProgram(context, 1, &deviceID, "-create-library", 1, &library_object,
                                       NULL, NULL, &error);
    test_error( error, "Unable to create a simple library" );

    // --- consumer side ---
    error = create_single_kernel_helper_create_program(context, &consumer_object, 1, &another_simple_kernel);
    if (consumer_object == NULL || error != CL_SUCCESS)
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(consumer_object, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // --- final link: compiled object first, library second ---
    cl_program link_inputs[2] = { consumer_object, library };
    cl_program executable = clLinkProgram(context, 1, &deviceID, "", 2, link_inputs, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from a binary and a library" );

    // --- tear down ---
    error = clReleaseProgram( library_object );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( consumer_object );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( library );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( executable );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
// Creates a library from simple_kernel, links a compiled another_simple_kernel
// against it, and runs both "CopyBuffer" and "AnotherCopyBuffer" from the
// resulting program through verifyCopyBuffer.
//
// deviceID     - device to compile and link for
// context      - context owning the programs
// queue        - queue the kernels are executed on
// num_elements - unused by this test
//
// Returns 0 on success, -1 when a source program cannot be created, the
// verifyCopyBuffer result when a verification fails; other failures leave
// through test_error.
int test_execute_after_simple_library_with_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program, another_program;

    log_info("Testing execution after linking a binary with a simple library...\n");
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program my_newly_minted_library = clLinkProgram(context, 1, &deviceID, "-create-library", 1, &program, NULL, NULL, &error);
    test_error( error, "Unable to create a simple library" );

    error = create_single_kernel_helper_create_program(context, &another_program, 1, &another_simple_kernel);
    if( another_program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(another_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program program_and_archive[2] = { another_program, my_newly_minted_library };
    cl_program fully_linked_program = clLinkProgram(context, 1, &deviceID, "", 2, program_and_archive, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from a binary and a library" );

    cl_kernel kernel = clCreateKernel(fully_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    // Remember the verdict instead of returning immediately, so the objects
    // created above are released even when verification fails.
    int result = verifyCopyBuffer(context, queue, kernel);

    // The second kernel is only exercised when the first one passed.
    cl_kernel another_kernel = NULL;
    if( result == CL_SUCCESS )
    {
        another_kernel = clCreateKernel(fully_linked_program, "AnotherCopyBuffer", &error);
        test_error( error, "Unable to create another simple kernel" );

        result = verifyCopyBuffer(context, queue, another_kernel);
    }

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    if( another_kernel != NULL )
    {
        error = clReleaseKernel( another_kernel );
        test_error( error, "Unable to release another kernel object" );
    }

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( another_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_minted_library );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( fully_linked_program );
    test_error( error, "Unable to release program object" );

    return result;
}
|
|
|
|
// Compiles simple_kernel and another_simple_kernel separately and links the two
// compiled objects into a single program. Nothing is executed; the test only
// checks that each step succeeds.
//
// deviceID     - device to compile and link for
// context      - context owning the programs
// queue        - unused by this test
// num_elements - unused by this test
//
// Returns 0 when every step succeeds and -1 when a source program cannot be
// created; any other failure leaves through test_error.
int test_two_file_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program first_object;
    cl_program second_object;

    log_info("Testing two file compiling and linking...\n");

    // --- first translation unit ---
    error = create_single_kernel_helper_create_program(context, &first_object, 1, &simple_kernel);
    if (first_object == NULL || error != CL_SUCCESS)
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(first_object, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // --- second translation unit ---
    error = create_single_kernel_helper_create_program(context, &second_object, 1, &another_simple_kernel);
    if (second_object == NULL || error != CL_SUCCESS)
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(second_object, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    // --- link both objects together ---
    cl_program link_inputs[2] = { first_object, second_object };
    cl_program executable = clLinkProgram(context, 1, &deviceID, "", 2, link_inputs, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from two binaries" );

    // --- tear down ---
    error = clReleaseProgram( first_object );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( second_object );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( executable );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compiles two kernel sources separately, links them into one program and
 * then runs both kernels ("CopyBuffer" and "AnotherCopyBuffer") from the
 * linked program through verifyCopyBuffer.
 *
 * deviceID      - device the programs are compiled and linked for
 * context       - context the programs and kernels are created in
 * queue         - command queue handed to verifyCopyBuffer
 * num_elements  - not referenced by this test
 *
 * Returns 0 on success, -1 when a source program cannot be created, or the
 * non-success code returned by verifyCopyBuffer.
 * NOTE(review): every other failure is routed through test_error, which
 * presumably logs and returns from this function -- confirm in the harness.
 */
int test_execute_after_two_file_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    /* Start from NULL so the NULL checks below never read an indeterminate
       handle if the helper fails before storing to its out-parameter. */
    cl_program program = NULL, another_program = NULL;

    log_info("Testing two file compiling and linking and execution of two kernels afterwards ...\n");

    /* First translation unit. */
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    /* Second translation unit. */
    error = create_single_kernel_helper_create_program(context, &another_program, 1, &another_simple_kernel);
    if( another_program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(another_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    /* Link both compiled objects with empty link options. */
    cl_program two_programs[2] = { program, another_program };
    cl_program fully_linked_program = clLinkProgram(context, 1, &deviceID, "", 2, two_programs, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from two binaries" );

    /* Run the kernel that came from the first source. */
    cl_kernel kernel = clCreateKernel(fully_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    error = verifyCopyBuffer(context, queue, kernel);
    if (error != CL_SUCCESS)
        return error;

    /* Run the kernel that came from the second source. */
    cl_kernel another_kernel = clCreateKernel(fully_linked_program, "AnotherCopyBuffer", &error);
    test_error( error, "Unable to create another simple kernel" );

    error = verifyCopyBuffer(context, queue, another_kernel);
    if (error != CL_SUCCESS)
        return error;

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseKernel( another_kernel );
    test_error( error, "Unable to release another kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( another_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( fully_linked_program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Compiles a kernel source that includes a header supplied as an embedded
 * header program, compiles a second plain kernel source, links both and
 * runs the "CopyBuffer" and "AnotherCopyBuffer" kernels of the result
 * through verifyCopyBuffer.
 *
 * Returns 0 on success, -1 when one of the source programs cannot be
 * created, or the non-success code returned by verifyCopyBuffer.
 * num_elements is not referenced.
 */
int test_execute_after_embedded_header_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int err;

    log_info("Testing execution after embedded header link...\n");

    /* Program whose source pulls in the header. */
    cl_program including_program = clCreateProgramWithSource(context, 1, &another_simple_kernel_with_header, NULL, &err);
    if( err != CL_SUCCESS || including_program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( err ), __FILE__, __LINE__ );
        return -1;
    }

    /* The header itself, wrapped in its own program object. */
    cl_program header_program = clCreateProgramWithSource(context, 1, &simple_header, NULL, &err);
    if( err != CL_SUCCESS || header_program == NULL )
    {
        log_error( "ERROR: Unable to create a simple header program! (%s in %s:%d)\n", IGetErrorString( err ), __FILE__, __LINE__ );
        return -1;
    }

    /* Compile with the header passed in as an embedded header. */
    err = clCompileProgram(including_program, 1, &deviceID, NULL, 1, &header_program, &simple_header_name, NULL, NULL);
    test_error( err, "Unable to compile a simple program with embedded header" );

    /* Second, header-free program. */
    cl_program plain_program = clCreateProgramWithSource(context, 1, &simple_kernel, NULL, &err);
    if( err != CL_SUCCESS || plain_program == NULL )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( err ), __FILE__, __LINE__ );
        return -1;
    }

    err = clCompileProgram(plain_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( err, "Unable to compile a simple program" );

    /* Link the two compiled objects with empty link options. */
    cl_program link_inputs[2] = { including_program, plain_program };
    cl_program linked_program = clLinkProgram(context, 1, &deviceID, "", 2, link_inputs, NULL, NULL, &err);
    test_error( err, "Unable to create an executable from two binaries, one compiled with embedded header" );

    /* Exercise the first kernel. */
    cl_kernel copy_kernel = clCreateKernel(linked_program, "CopyBuffer", &err);
    test_error( err, "Unable to create a simple kernel" );

    err = verifyCopyBuffer(context, queue, copy_kernel);
    if (err != CL_SUCCESS)
    {
        return err;
    }

    /* Exercise the second kernel. */
    cl_kernel another_copy_kernel = clCreateKernel(linked_program, "AnotherCopyBuffer", &err);
    test_error( err, "Unable to create another simple kernel" );

    err = verifyCopyBuffer(context, queue, another_copy_kernel);
    if (err != CL_SUCCESS)
    {
        return err;
    }

    /* Release everything in the same order as it has always been released. */
    err = clReleaseKernel( copy_kernel );
    test_error( err, "Unable to release kernel object" );

    err = clReleaseKernel( another_copy_kernel );
    test_error( err, "Unable to release another kernel object" );

    err = clReleaseProgram( including_program );
    test_error( err, "Unable to release program object" );

    err = clReleaseProgram( header_program );
    test_error( err, "Unable to release program object" );

    err = clReleaseProgram( plain_program );
    test_error( err, "Unable to release program object" );

    err = clReleaseProgram( linked_program );
    test_error( err, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * The tests below use the underscore-prefixed directory/file helpers
 * (_mkdir, _chdir, _rmdir, _unlink). On macOS and Linux they are mapped
 * onto the POSIX functions; elsewhere <direct.h> is included instead.
 * Both __linux__ (used by the rest of this file) and the legacy __linux
 * spelling are accepted.
 */
#if defined(__APPLE__) || defined(__linux__) || defined(__linux)
#define _mkdir(x) mkdir((x),S_IRWXU)
#define _chdir chdir
#define _rmdir rmdir
#define _unlink unlink
#else
#include <direct.h>
#endif
|
|
|
|
/*
 * Compiles a kernel source whose header is found through an include path
 * ("-I") on disk, compiles a second plain kernel source, links both and
 * runs the "CopyBuffer" and "AnotherCopyBuffer" kernels of the result
 * through verifyCopyBuffer.
 *
 * The header is written to foo/bar/<simple_header_name>. On Linux and
 * macOS (but not Android) the process first changes into /tmp and stays
 * there afterwards; on other platforms foo/bar is created relative to the
 * current working directory.
 *
 * Returns 0 on success, -1 on any setup/cleanup or program-creation
 * failure, or the non-success code returned by verifyCopyBuffer.
 * num_elements is not referenced.
 * NOTE(review): OpenCL API failures are routed through test_error, which
 * presumably logs and returns from this function -- confirm in the harness.
 */
int test_execute_after_included_header_link(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    cl_program program, simple_program;

    log_info("Testing execution after included header link...\n");

    // we will test execution after compiling and linking with included headers
    program = clCreateProgramWithSource(context, 1, &another_simple_kernel_with_header, NULL, &error);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    /* setup */
#if (defined(__linux__) || defined(__APPLE__)) && (!defined( __ANDROID__ ))
    /* Some test systems don't allow one to write in the test directory */
    if (_chdir("/tmp") != 0) {
        log_error( "ERROR: Unable to change to directory /tmp! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
#endif
    if (_mkdir("foo") != 0) {
        log_error( "ERROR: Unable to create directory foo! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    if (_mkdir("foo/bar") != 0) {
        log_error( "ERROR: Unable to create directory foo/bar! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    if (_chdir("foo/bar") != 0) {
        log_error( "ERROR: Unable to change to directory foo/bar! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    FILE* simple_header_file = fopen(simple_header_name, "w");
    if (simple_header_file == NULL) {
        log_error( "ERROR: Unable to create simple header file %s! (in %s:%d)\n", simple_header_name, __FILE__, __LINE__ );
        return -1;
    }
    if (fprintf(simple_header_file, "%s", simple_header) < 0) {
        log_error( "ERROR: Unable to write to simple header file %s! (in %s:%d)\n", simple_header_name, __FILE__, __LINE__);
        /* Do not leak the stream on the failure path. */
        fclose(simple_header_file);
        return -1;
    }
    if (fclose(simple_header_file) != 0) {
        log_error( "ERROR: Unable to close simple header file %s! (in %s:%d)\n", simple_header_name, __FILE__, __LINE__);
        return -1;
    }
    /* Back to the directory that contains foo/. */
    if (_chdir("../..") != 0) {
        log_error( "ERROR: Unable to change to original working directory! (in %s:%d)\n", __FILE__, __LINE__);
        return -1;
    }

    /* The compile status is deliberately checked only after the cleanup
       below, so that a failed compile does not leave foo/bar behind and
       make the next run fail at _mkdir. */
#if (defined(__linux__) || defined(__APPLE__)) && (!defined( __ANDROID__ ))
    error = clCompileProgram(program, 1, &deviceID, "-I/tmp/foo/bar", 0, NULL, NULL, NULL, NULL);
#else
    error = clCompileProgram(program, 1, &deviceID, "-Ifoo/bar", 0, NULL, NULL, NULL, NULL);
#endif

    /* cleanup (none of these steps touches `error`) */
    if (_chdir("foo/bar") != 0) {
        log_error( "ERROR: Unable to change to directory foo/bar! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    if (_unlink(simple_header_name) != 0) {
        log_error( "ERROR: Unable to remove simple header file %s! (in %s:%d)\n", simple_header_name, __FILE__, __LINE__ );
        return -1;
    }
    if (_chdir("../..") != 0) {
        log_error( "ERROR: Unable to change to original working directory! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    if (_rmdir("foo/bar") != 0) {
        log_error( "ERROR: Unable to remove directory foo/bar! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    if (_rmdir("foo") != 0) {
        log_error( "ERROR: Unable to remove directory foo! (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }

    /* Now report the outcome of the compile issued before the cleanup. */
    test_error( error, "Unable to compile a simple program with included header" );

    /* Second, header-free program. */
    simple_program = clCreateProgramWithSource(context, 1, &simple_kernel, NULL, &error);
    if( simple_program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(simple_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    /* Link the two compiled objects with empty link options. */
    cl_program two_programs[2] = { program, simple_program };
    cl_program fully_linked_program = clLinkProgram(context, 1, &deviceID, "", 2, two_programs, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from two binaries, one compiled with included header" );

    cl_kernel kernel = clCreateKernel(fully_linked_program, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    error = verifyCopyBuffer(context, queue, kernel);
    if (error != CL_SUCCESS)
        return error;

    cl_kernel another_kernel = clCreateKernel(fully_linked_program, "AnotherCopyBuffer", &error);
    test_error( error, "Unable to create another simple kernel" );

    error = verifyCopyBuffer(context, queue, another_kernel);
    if (error != CL_SUCCESS)
        return error;

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseKernel( another_kernel );
    test_error( error, "Unable to release another kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( simple_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( fully_linked_program );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
/*
 * Verifies the value reported for CL_PROGRAM_BINARY_TYPE at each stage:
 *   - a freshly compiled program and a program re-created from its binary
 *     must be CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT;
 *   - a library linked with "-create-library" and a program re-created
 *     from its binary must be CL_PROGRAM_BINARY_TYPE_LIBRARY;
 *   - an executable linked from a compiled object plus that library, a
 *     program re-created from its binary, and a program built directly
 *     with clBuildProgram must be CL_PROGRAM_BINARY_TYPE_EXECUTABLE.
 * The executable re-created from binary is also built and both of its
 * kernels are run through verifyCopyBuffer.
 *
 * Returns 0 on success, -1 on a failed check or allocation, or the
 * non-success code returned by verifyCopyBuffer. num_elements is not
 * referenced.
 * NOTE(review): OpenCL API failures are routed through test_error, which
 * presumably logs and returns from this function; the "free before
 * test_error" lines below rely on that -- confirm in the harness.
 */
int test_program_binary_type(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;
    /* NULL-initialised so the checks after the helper calls never read an
       indeterminate handle if the helper fails before storing to them. */
    cl_program program = NULL, another_program = NULL;
    cl_program program_with_binary, fully_linked_program_with_binary;
    /* Reset to -1 before every query so a query that writes nothing is caught. */
    cl_program_binary_type program_type = -1;
    size_t size;
    size_t binarySize;
    unsigned char *binary;
    /* One binary pointer / load status per device; only one device is used. */
    unsigned char *buffers[ 1 ];
    cl_int loadErrors[ 1 ];

    log_info("Testing querying of program binary type...\n");

    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    error = clGetProgramBuildInfo (program, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT)
    {
        log_error( "ERROR: Expected program type of a just compiled program to be CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    program_type = -1;

    // Get the size of the resulting binary (only one device)
    error = clGetProgramInfo( program, CL_PROGRAM_BINARY_SIZES, sizeof( binarySize ), &binarySize, NULL );
    test_error( error, "Unable to get binary size" );

    // Sanity check
    if( binarySize == 0 )
    {
        log_error( "ERROR: Binary size of program is zero (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }

    // Create a buffer and get the actual binary
    binary = (unsigned char*)malloc(sizeof(unsigned char)*binarySize);
    if (binary == NULL) {
        /* size_t is cast because it need not have the width of unsigned long. */
        log_error( "ERROR: Unable to allocate binary character array with %lu characters! (in %s:%d)\n", (unsigned long)binarySize, __FILE__, __LINE__ );
        return -1;
    }
    buffers[ 0 ] = binary;

    // Do another sanity check here first
    error = clGetProgramInfo( program, CL_PROGRAM_BINARIES, 0, NULL, &size );
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get expected size of binaries array" );
    if( size != sizeof( buffers ) )
    {
        log_error( "ERROR: Expected size of binaries array in clGetProgramInfo is incorrect (should be %d, got %d) (in %s:%d)\n", (int)sizeof( buffers ), (int)size, __FILE__, __LINE__ );
        free(binary);
        return -1;
    }

    error = clGetProgramInfo( program, CL_PROGRAM_BINARIES, sizeof( buffers ), buffers, NULL );
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get program binary" );

    // use clCreateProgramWithBinary
    program_with_binary = clCreateProgramWithBinary(context, 1, &deviceID, &binarySize, (const unsigned char**)buffers, loadErrors, &error);
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to create program with binary" );

    error = clGetProgramBuildInfo (program_with_binary, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT)
    {
        log_error( "ERROR: Expected program type of a program created from compiled object to be CL_PROGRAM_BINARY_TYPE_COMPILED_OBJECT (in %s:%d)\n", __FILE__, __LINE__ );
        free(binary);
        return -1;
    }
    program_type = -1;
    free(binary);

    /* Turn the re-created compiled object into a library. */
    cl_program my_newly_minted_library = clLinkProgram(context, 1, &deviceID, "-create-library", 1, &program_with_binary, NULL, NULL, &error);
    test_error( error, "Unable to create a simple library" );
    error = clGetProgramBuildInfo (my_newly_minted_library, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_LIBRARY)
    {
        log_error( "ERROR: Expected program type of a just linked library to be CL_PROGRAM_BINARY_TYPE_LIBRARY (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    program_type = -1;

    // Get the size of the resulting library (only one device)
    error = clGetProgramInfo( my_newly_minted_library, CL_PROGRAM_BINARY_SIZES, sizeof( binarySize ), &binarySize, NULL );
    test_error( error, "Unable to get binary size" );

    // Sanity check
    if( binarySize == 0 )
    {
        log_error( "ERROR: Binary size of program is zero (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }

    // Create a buffer and get the actual binary
    binary = (unsigned char*)malloc(sizeof(unsigned char)*binarySize);
    if (binary == NULL) {
        log_error( "ERROR: Unable to allocate binary character array with %lu characters! (in %s:%d)\n", (unsigned long)binarySize, __FILE__, __LINE__);
        return -1;
    }
    buffers[ 0 ] = binary;

    // Do another sanity check here first
    error = clGetProgramInfo( my_newly_minted_library, CL_PROGRAM_BINARIES, 0, NULL, &size );
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get expected size of binaries array" );
    if( size != sizeof( buffers ) )
    {
        log_error( "ERROR: Expected size of binaries array in clGetProgramInfo is incorrect (should be %d, got %d) (in %s:%d)\n", (int)sizeof( buffers ), (int)size, __FILE__, __LINE__ );
        free(binary);
        return -1;
    }

    error = clGetProgramInfo( my_newly_minted_library, CL_PROGRAM_BINARIES, sizeof( buffers ), buffers, NULL );
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get program binary" );

    // use clCreateProgramWithBinary
    cl_program library_with_binary = clCreateProgramWithBinary(context, 1, &deviceID, &binarySize, (const unsigned char**)buffers, loadErrors, &error);
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to create program with binary" );
    error = clGetProgramBuildInfo (library_with_binary, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_LIBRARY)
    {
        log_error( "ERROR: Expected program type of a library loaded with binary to be CL_PROGRAM_BINARY_TYPE_LIBRARY (in %s:%d)\n", __FILE__, __LINE__ );
        free(binary);
        return -1;
    }
    program_type = -1;
    free(binary);

    /* Second compiled object, to be linked against the library. */
    error = create_single_kernel_helper_create_program(context, &another_program, 1, &another_simple_kernel);
    if( another_program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clCompileProgram(another_program, 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
    test_error( error, "Unable to compile a simple program" );

    cl_program program_and_archive[2] = { another_program, library_with_binary };
    cl_program fully_linked_program = clLinkProgram(context, 1, &deviceID, "", 2, program_and_archive, NULL, NULL, &error);
    test_error( error, "Unable to create an executable from a binary and a library" );

    error = clGetProgramBuildInfo (fully_linked_program, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_EXECUTABLE)
    {
        log_error( "ERROR: Expected program type of a newly build executable to be CL_PROGRAM_BINARY_TYPE_EXECUTABLE (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    program_type = -1;

    // Get the size of the resulting binary (only one device)
    error = clGetProgramInfo( fully_linked_program, CL_PROGRAM_BINARY_SIZES, sizeof( binarySize ), &binarySize, NULL );
    test_error( error, "Unable to get binary size" );

    // Sanity check
    if( binarySize == 0 )
    {
        log_error( "ERROR: Binary size of program is zero (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }

    // Create a buffer and get the actual binary
    binary = (unsigned char*)malloc(sizeof(unsigned char)*binarySize);
    if (binary == NULL) {
        log_error( "ERROR: Unable to allocate binary character array with %lu characters! (in %s:%d)\n", (unsigned long)binarySize, __FILE__, __LINE__ );
        return -1;
    }
    buffers[ 0 ] = binary;

    // Do another sanity check here first
    error = clGetProgramInfo( fully_linked_program, CL_PROGRAM_BINARIES, 0, NULL, &size );
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get expected size of binaries array" );
    if( size != sizeof( buffers ) )
    {
        log_error( "ERROR: Expected size of binaries array in clGetProgramInfo is incorrect (should be %d, got %d) (in %s:%d)\n", (int)sizeof( buffers ), (int)size, __FILE__, __LINE__ );
        free(binary);
        return -1;
    }

    error = clGetProgramInfo( fully_linked_program, CL_PROGRAM_BINARIES, sizeof( buffers ), buffers, NULL );
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get program binary" );

    // use clCreateProgramWithBinary
    fully_linked_program_with_binary = clCreateProgramWithBinary(context, 1, &deviceID, &binarySize, (const unsigned char**)buffers, loadErrors, &error);
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to create program with binary" );

    error = clGetProgramBuildInfo (fully_linked_program_with_binary, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    if( error != CL_SUCCESS ) free(binary);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_EXECUTABLE)
    {
        log_error( "ERROR: Expected program type of a program created from a fully linked executable binary to be CL_PROGRAM_BINARY_TYPE_EXECUTABLE (in %s:%d)\n", __FILE__, __LINE__ );
        free(binary);
        return -1;
    }
    program_type = -1;
    free(binary);

    /* Build the executable loaded from binary and run both of its kernels. */
    error = clBuildProgram(fully_linked_program_with_binary, 1, &deviceID, NULL, NULL, NULL);
    test_error( error, "Unable to build a simple program" );

    cl_kernel kernel = clCreateKernel(fully_linked_program_with_binary, "CopyBuffer", &error);
    test_error( error, "Unable to create a simple kernel" );

    error = verifyCopyBuffer(context, queue, kernel);
    if (error != CL_SUCCESS)
        return error;

    cl_kernel another_kernel = clCreateKernel(fully_linked_program_with_binary, "AnotherCopyBuffer", &error);
    test_error( error, "Unable to create another simple kernel" );

    error = verifyCopyBuffer(context, queue, another_kernel);
    if (error != CL_SUCCESS)
        return error;

    /* All done! */
    error = clReleaseKernel( kernel );
    test_error( error, "Unable to release kernel object" );

    error = clReleaseKernel( another_kernel );
    test_error( error, "Unable to release another kernel object" );

    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    /* Oh, one more thing. Steve Jobs and apparently Herb Sutter. The question is "Who is copying whom?" */
    /* Re-create the first program and build it in one step with clBuildProgram. */
    program = NULL;
    error = create_single_kernel_helper_create_program(context, &program, 1, &simple_kernel);
    if( program == NULL || error != CL_SUCCESS )
    {
        log_error( "ERROR: Unable to create a simple test program! (%s in %s:%d)\n", IGetErrorString( error ), __FILE__, __LINE__ );
        return -1;
    }

    error = clBuildProgram(program, 1, &deviceID, NULL, NULL, NULL);
    test_error( error, "Unable to build a simple program" );
    error = clGetProgramBuildInfo (program, deviceID, CL_PROGRAM_BINARY_TYPE, sizeof(cl_program_binary_type), &program_type, NULL);
    test_error( error, "Unable to get program binary type" );
    if (program_type != CL_PROGRAM_BINARY_TYPE_EXECUTABLE)
    {
        log_error( "ERROR: Expected program type of a program built with clBuildProgram to be CL_PROGRAM_BINARY_TYPE_EXECUTABLE (in %s:%d)\n", __FILE__, __LINE__ );
        return -1;
    }
    program_type = -1;

    /* All's well that ends well. William Shakespeare */
    error = clReleaseProgram( program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( another_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( my_newly_minted_library );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( library_with_binary );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( fully_linked_program );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( fully_linked_program_with_binary );
    test_error( error, "Unable to release program object" );

    error = clReleaseProgram( program_with_binary );
    test_error( error, "Unable to release program object" );

    return 0;
}
|
|
|
|
volatile int compileNotificationSent;
|
|
|
|
void CL_CALLBACK test_notify_compile_complete( cl_program program, void *userData )
|
|
{
|
|
if( userData == NULL || strcmp( (char *)userData, "compilation" ) != 0 )
|
|
{
|
|
log_error( "ERROR: User data passed in to compile notify function was not correct! (in %s:%d)\n", __FILE__, __LINE__ );
|
|
compileNotificationSent = -1;
|
|
}
|
|
else
|
|
compileNotificationSent = 1;
|
|
log_info( "\n <-- program successfully compiled\n" );
|
|
}
|
|
|
|
volatile int libraryCreationNotificationSent;
|
|
|
|
void CL_CALLBACK test_notify_create_library_complete( cl_program program, void *userData )
|
|
{
|
|
if( userData == NULL || strcmp( (char *)userData, "create library" ) != 0 )
|
|
{
|
|
log_error( "ERROR: User data passed in to library creation notify function was not correct! (in %s:%d)\n", __FILE__, __LINE__ );
|
|
libraryCreationNotificationSent = -1;
|
|
}
|
|
else
|
|
libraryCreationNotificationSent = 1;
|
|
log_info( "\n <-- library successfully created\n" );
|
|
}
|
|
|
|
volatile int linkNotificationSent;
|
|
|
|
void CL_CALLBACK test_notify_link_complete( cl_program program, void *userData )
|
|
{
|
|
if( userData == NULL || strcmp( (char *)userData, "linking" ) != 0 )
|
|
{
|
|
log_error( "ERROR: User data passed in to link notify function was not correct! (in %s:%d)\n", __FILE__, __LINE__ );
|
|
linkNotificationSent = -1;
|
|
}
|
|
else
|
|
linkNotificationSent = 1;
|
|
log_info( "\n <-- program successfully linked\n" );
|
|
}
|
|
|
|
int test_large_compile_and_link_status_options_log(cl_context context, cl_device_id deviceID, cl_command_queue queue, unsigned int numLines)
|
|
{
|
|
int error;
|
|
cl_program program;
|
|
cl_program * simple_kernels;
|
|
const char **lines;
|
|
unsigned int i;
|
|
char buffer[MAX_LINE_SIZE_IN_PROGRAM];
|
|
char *compile_log;
|
|
char *compile_options;
|
|
char *library_log;
|
|
char *library_options;
|
|
char *linking_log;
|
|
char *linking_options;
|
|
cl_build_status status;
|
|
size_t size_ret;
|
|
|
|
compileNotificationSent = libraryCreationNotificationSent = linkNotificationSent = 0;
|
|
|
|
simple_kernels = (cl_program*)malloc(numLines*sizeof(cl_program));
|
|
if (simple_kernels == NULL) {
|
|
log_error( "ERROR: Unable to allocate kernels array with %d kernels! (in %s:%d)\n", numLines, __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
/* First, allocate the array for our line pointers */
|
|
lines = (const char **)malloc( (2*numLines + 2) * sizeof( const char * ) );
|
|
if (lines == NULL) {
|
|
log_error( "ERROR: Unable to allocate lines array with %d lines! (in %s:%d)\n", (2*numLines + 2), __FILE__, __LINE__);
|
|
return -1;
|
|
}
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, composite_kernel_extern_template, i);
|
|
lines[i] = _strdup(buffer);
|
|
}
|
|
/* First and last lines are easy */
|
|
lines[ numLines ] = composite_kernel_start;
|
|
lines[ 2*numLines + 1] = composite_kernel_end;
|
|
|
|
/* Fill the rest with templated kernels */
|
|
for(i = numLines + 1; i < 2*numLines + 1; i++ )
|
|
{
|
|
sprintf(buffer, composite_kernel_template, i - numLines - 1);
|
|
lines[ i ] = _strdup(buffer);
|
|
}
|
|
|
|
/* Try to create a program with these lines */
|
|
error = create_single_kernel_helper_create_program(context, &program, 2 * numLines + 2, lines);
|
|
if( program == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s) (in %s:%d)\n", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Lets check that the compilation status is CL_BUILD_NONE */
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get program compile status" );
|
|
if (status != CL_BUILD_NONE)
|
|
{
|
|
log_error( "ERROR: Expected compile status to be CL_BUILD_NONE prior to the beginning of the compilation! (status: %d in %s:%d)\n", (int)status, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(program, 1, &deviceID, NULL, 0, NULL, NULL, test_notify_compile_complete, (void *)"compilation");
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
/* Wait for compile to complete (just keep polling, since we're just a test */
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get program compile status" );
|
|
|
|
while( (int)status == CL_BUILD_IN_PROGRESS )
|
|
{
|
|
log_info( "\n -- still waiting for compile... (status is %d)", status );
|
|
sleep( 1 );
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get program compile status" );
|
|
}
|
|
if( status != CL_BUILD_SUCCESS )
|
|
{
|
|
log_error( "ERROR: compile failed! (status: %d in %s:%d)\n", (int)status, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_LOG, 0, NULL, &size_ret );
|
|
test_error( error, "Device failed to return compile log size" );
|
|
compile_log = (char *)malloc(size_ret);
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_LOG, size_ret, compile_log, NULL );
|
|
if (error != CL_SUCCESS){
|
|
log_error("Device failed to return a compile log (in %s:%d)\n", __FILE__, __LINE__);
|
|
test_error(error, "clGetProgramBuildInfo CL_PROGRAM_BUILD_LOG failed");
|
|
}
|
|
log_info("BUILD LOG: %s\n", compile_log);
|
|
free(compile_log);
|
|
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_OPTIONS, 0, NULL, &size_ret );
|
|
test_error(error, "Device failed to return compile options size");
|
|
compile_options = (char *)malloc(size_ret);
|
|
error = clGetProgramBuildInfo( program, deviceID, CL_PROGRAM_BUILD_OPTIONS, size_ret, compile_options, NULL );
|
|
test_error(error, "Device failed to return compile options.\nclGetProgramBuildInfo CL_PROGRAM_BUILD_OPTIONS failed");
|
|
|
|
log_info("BUILD OPTIONS: %s\n", compile_options);
|
|
free(compile_options);
|
|
|
|
/* Create and compile templated kernels */
|
|
for( i = 0; i < numLines; i++)
|
|
{
|
|
sprintf(buffer, simple_kernel_template, i);
|
|
const char* kernel_source = _strdup(buffer);
|
|
error = create_single_kernel_helper_create_program(context, &simple_kernels[i], 1, &kernel_source);
|
|
if( simple_kernels[i] == NULL || error != CL_SUCCESS )
|
|
{
|
|
log_error( "ERROR: Unable to create long test program with %d lines! (%s in %s:%d)", numLines, IGetErrorString( error ), __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
|
|
/* Compile it */
|
|
error = clCompileProgram(simple_kernels[i], 1, &deviceID, NULL, 0, NULL, NULL, NULL, NULL);
|
|
test_error( error, "Unable to compile a simple program" );
|
|
|
|
free((void*)kernel_source);
|
|
}
|
|
|
|
/* Create library out of compiled templated kernels */
|
|
cl_program my_newly_minted_library = clLinkProgram(context, 1, &deviceID, "-create-library", numLines, simple_kernels, test_notify_create_library_complete, (void *)"create library", &error);
|
|
test_error( error, "Unable to create a multi-line library" );
|
|
|
|
/* Wait for library creation to complete (just keep polling, since we're just a test */
|
|
error = clGetProgramBuildInfo( my_newly_minted_library, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get library creation link status" );
|
|
|
|
while( (int)status == CL_BUILD_IN_PROGRESS )
|
|
{
|
|
log_info( "\n -- still waiting for library creation... (status is %d)", status );
|
|
sleep( 1 );
|
|
error = clGetProgramBuildInfo( my_newly_minted_library, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get library creation link status" );
|
|
}
|
|
if( status != CL_BUILD_SUCCESS )
|
|
{
|
|
log_error( "ERROR: library creation failed! (status: %d in %s:%d)\n", (int)status, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
error = clGetProgramBuildInfo( my_newly_minted_library, deviceID, CL_PROGRAM_BUILD_LOG, 0, NULL, &size_ret );
|
|
test_error( error, "Device failed to return a library creation log size" );
|
|
library_log = (char *)malloc(size_ret);
|
|
error = clGetProgramBuildInfo( my_newly_minted_library, deviceID, CL_PROGRAM_BUILD_LOG, size_ret, library_log, NULL );
|
|
if (error != CL_SUCCESS) {
|
|
log_error("Device failed to return a library creation log (in %s:%d)\n", __FILE__, __LINE__);
|
|
test_error(error, "clGetProgramBuildInfo CL_PROGRAM_BUILD_LOG failed");
|
|
}
|
|
log_info("CREATE LIBRARY LOG: %s\n", library_log);
|
|
free(library_log);
|
|
|
|
error = clGetProgramBuildInfo( my_newly_minted_library, deviceID, CL_PROGRAM_BUILD_OPTIONS, 0, NULL, &size_ret );
|
|
test_error(error, "Device failed to return library creation options size");
|
|
library_options = (char *)malloc(size_ret);
|
|
error = clGetProgramBuildInfo( my_newly_minted_library, deviceID, CL_PROGRAM_BUILD_OPTIONS, size_ret, library_options, NULL );
|
|
test_error(error, "Device failed to return library creation options.\nclGetProgramBuildInfo CL_PROGRAM_BUILD_OPTIONS failed");
|
|
|
|
log_info("CREATE LIBRARY OPTIONS: %s\n", library_options);
|
|
free(library_options);
|
|
|
|
/* Link the program that calls the kernels and the library that contains them */
|
|
cl_program programs[2] = { program, my_newly_minted_library };
|
|
cl_program my_newly_linked_program = clLinkProgram(context, 1, &deviceID, NULL, 2, programs, test_notify_link_complete, (void *)"linking", &error);
|
|
test_error( error, "Unable to link a program with a library" );
|
|
|
|
/* Wait for linking to complete (just keep polling, since we're just a test */
|
|
error = clGetProgramBuildInfo( my_newly_linked_program, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get program link status" );
|
|
|
|
while( (int)status == CL_BUILD_IN_PROGRESS )
|
|
{
|
|
log_info( "\n -- still waiting for program linking... (status is %d)", status );
|
|
sleep( 1 );
|
|
error = clGetProgramBuildInfo( my_newly_linked_program, deviceID, CL_PROGRAM_BUILD_STATUS, sizeof( status ), &status, NULL );
|
|
test_error( error, "Unable to get program link status" );
|
|
}
|
|
if( status != CL_BUILD_SUCCESS )
|
|
{
|
|
log_error( "ERROR: program linking failed! (status: %d in %s:%d)\n", (int)status, __FILE__, __LINE__ );
|
|
return -1;
|
|
}
|
|
error = clGetProgramBuildInfo( my_newly_linked_program, deviceID, CL_PROGRAM_BUILD_LOG, 0, NULL, &size_ret );
|
|
test_error( error, "Device failed to return a linking log size" );
|
|
linking_log = (char *)malloc(size_ret);
|
|
error = clGetProgramBuildInfo( my_newly_linked_program, deviceID, CL_PROGRAM_BUILD_LOG, size_ret, linking_log, NULL );
|
|
if (error != CL_SUCCESS){
|
|
log_error("Device failed to return a linking log (in %s:%d).\n", __FILE__, __LINE__);
|
|
test_error(error, "clGetProgramBuildInfo CL_PROGRAM_BUILD_LOG failed");
|
|
}
|
|
log_info("BUILDING LOG: %s\n", linking_log);
|
|
free(linking_log);
|
|
|
|
error = clGetProgramBuildInfo( my_newly_linked_program, deviceID, CL_PROGRAM_BUILD_OPTIONS, 0, NULL, &size_ret );
|
|
test_error(error, "Device failed to return linking options size");
|
|
linking_options = (char *)malloc(size_ret);
|
|
error = clGetProgramBuildInfo( my_newly_linked_program, deviceID, CL_PROGRAM_BUILD_OPTIONS, size_ret, linking_options, NULL );
|
|
test_error(error, "Device failed to return linking options.\nclGetProgramBuildInfo CL_PROGRAM_BUILD_OPTIONS failed");
|
|
|
|
log_info("BUILDING OPTIONS: %s\n", linking_options);
|
|
free(linking_options);
|
|
|
|
// Create the composite kernel
|
|
cl_kernel kernel = clCreateKernel(my_newly_linked_program, "CompositeKernel", &error);
|
|
test_error( error, "Unable to create a composite kernel" );
|
|
|
|
// Run the composite kernel and verify the results
|
|
error = verifyCopyBuffer(context, queue, kernel);
|
|
if (error != CL_SUCCESS)
|
|
return error;
|
|
|
|
/* All done! */
|
|
error = clReleaseKernel( kernel );
|
|
test_error( error, "Unable to release kernel object" );
|
|
|
|
error = clReleaseProgram( program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
free( (void*)lines[i] );
|
|
free( (void*)lines[i+numLines+1] );
|
|
}
|
|
free( lines );
|
|
|
|
for(i = 0; i < numLines; i++)
|
|
{
|
|
error = clReleaseProgram( simple_kernels[i] );
|
|
test_error( error, "Unable to release program object" );
|
|
}
|
|
free( simple_kernels );
|
|
|
|
error = clReleaseProgram( my_newly_minted_library );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
error = clReleaseProgram( my_newly_linked_program );
|
|
test_error( error, "Unable to release program object" );
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Runs the large compile/link status, options and build-log test once for
 * every program size in a zero-terminated table, and reports how long each
 * run took on platforms where a timer is wired up (clock() on Windows,
 * gettimeofday() on Linux/macOS).
 *
 * num_elements is not used by this function.
 *
 * Returns 0 when every size passes, or -1 as soon as one run reports failure.
 */
int test_compile_and_link_status_options_log(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    /* A zero entry terminates the table; the larger sizes are disabled. */
    unsigned int toTest[] = { 256, 0 }; //512, 1024, 8192, 16384, 32768, 0 };
    unsigned int *lineCount;

    log_info( "Testing Compile and Link Status, Options and Logging ...this might take awhile...\n" );

    for( lineCount = toTest; *lineCount != 0; ++lineCount )
    {
        int result;

        log_info( " %d...\n", *lineCount );

        /* Take the starting timestamp with whichever timer this platform has. */
#if defined(_WIN32)
        clock_t start = clock();
#elif defined(__linux__) || defined(__APPLE__)
        struct timeval time1, time2;
        gettimeofday(&time1, NULL);
#endif

        result = test_large_compile_and_link_status_options_log( context, deviceID, queue, *lineCount );
        if( result != 0 )
        {
            log_error( "ERROR: large program compilation, linking, status, options and logging test failed for %d lines! (in %s:%d)\n", *lineCount, __FILE__, __LINE__ );
            return -1;
        }

        /* Only successful runs are timed and reported. */
#if defined(_WIN32)
        clock_t end = clock();
        log_perf( (float)( end - start ) / (float)CLOCKS_PER_SEC, false, "clock() time in secs", "%d lines", *lineCount );
#elif defined(__linux__) || defined(__APPLE__)
        gettimeofday(&time2, NULL);
        /* Whole seconds plus the microsecond remainder scaled to seconds. */
        const double elapsedSecs = (float)(time2.tv_sec - time1.tv_sec) + 1.0e-6 * (time2.tv_usec - time1.tv_usec);
        log_perf( elapsedSecs, false, "wall time in secs", "%d lines", *lineCount );
#endif
    }

    return 0;
}
|