You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1242 lines
41 KiB

//
// Copyright (c) 2017 The Khronos Group Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
#include "helpers.h"
#include "gl_headers.h"
#include "CL/cl_half.h"
#define CHECK_ERROR()\
{GLint __error = glGetError(); if(__error) {log_error( "GL ERROR: %s!\n", gluErrorString( err ));}}
#if defined(__linux__) || defined(GL_ES_VERSION_2_0)
// On linux we dont link to GLU library to avoid comaptibility issues with
// libstdc++
// FIXME: Implement this
const GLubyte* gluErrorString (GLenum error)
{
const char* gl_Error = "OpenGL Error";
return (const GLubyte*)gl_Error;
}
#endif
static void DrawQuad(void);
void * CreateGLTexture2D( size_t width, size_t height,
GLenum target, GLenum glFormat,
GLenum internalFormat, GLenum glType,
ExplicitType type, GLuint *outTextureID,
int *outError, bool allocateMem, MTdata d )
{
*outError = 0;
GLenum err = 0;
char * buffer = (char *)CreateRandomData(type, width * height * 4, d);
glGenTextures( 1, outTextureID );
glBindTexture( get_base_gl_target( target ), *outTextureID );
err = glGetError();
if( err != GL_NO_ERROR )
{
log_error( "ERROR: Failed to create GL texture object: %s!\n", gluErrorString( err ));
*outError = -1;
free( buffer );
return NULL;
}
#ifndef GL_ES_VERSION_2_0
glTexEnvi( GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, GL_REPLACE );
#endif
glTexParameteri( get_base_gl_target( target ), GL_TEXTURE_MIN_FILTER, GL_NEAREST );
glTexParameteri( get_base_gl_target( target ), GL_TEXTURE_MAG_FILTER, GL_NEAREST );
if( get_base_gl_target( target ) == GL_TEXTURE_CUBE_MAP )
{
char * temp = (char *)malloc(width * height * 4 * get_explicit_type_size( type ) * sizeof(cl_char));
if(allocateMem)
memcpy( temp, buffer, width * height * 4 * get_explicit_type_size( type ) );
else
memset( temp, 0, width * height * 4 * get_explicit_type_size( type ) );
glTexImage2D( GL_TEXTURE_CUBE_MAP_POSITIVE_X, 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, temp );
glTexImage2D( GL_TEXTURE_CUBE_MAP_POSITIVE_Y, 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, temp );
glTexImage2D( GL_TEXTURE_CUBE_MAP_POSITIVE_Z, 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, temp );
glTexImage2D( GL_TEXTURE_CUBE_MAP_NEGATIVE_X, 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, temp );
glTexImage2D( GL_TEXTURE_CUBE_MAP_NEGATIVE_Y, 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, temp );
glTexImage2D( GL_TEXTURE_CUBE_MAP_NEGATIVE_Z, 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, temp );
free(temp);
}
else
{
#ifdef GLES_DEBUG
log_info("- glTexImage2D : %s : %s : %d : %d : %s : %s\n",
GetGLTargetName(target),
GetGLFormatName(internalFormat),
width, height,
GetGLFormatName(glFormat),
GetGLTypeName(glType));
DumpGLBuffer(glType, width, height, buffer);
#endif
glTexImage2D( get_base_gl_target(target), 0, internalFormat, (GLsizei)width, (GLsizei)height, 0, glFormat, glType, buffer );
}
err = glGetError();
if( err != GL_NO_ERROR )
{
/** In section 9.8.3.1. of the CL 1.1. spec it says that:
*
* If a GL texture object with an internal format from table 9.4 is successfully created by
* OpenGL, then there is guaranteed to be a mapping to one of the corresponding CL image
* format(s) in that table.
*
* Notice that some of the formats in table 9.4 are not supported in OpenGL ES 2.0.
*/
log_info( "Warning: Skipping %s : %s : %d : %d : %s : %s : because glTexImage2D returned %s\n",
GetGLTargetName(target),
GetGLFormatName(internalFormat),
(int)(width), (int)(height),
GetGLFormatName(glFormat),
GetGLTypeName(glType),
gluErrorString( err ));
glDeleteTextures( 1, outTextureID );
*outTextureID = 0;
*outError = 0;
free( buffer );
err = glGetError();
return NULL;
}
#ifdef GLES_DEBUG
memset(buffer, 0, width * height * 4 * get_explicit_type_size( type ));
log_info("- glGetTexImage : %s : %s : %s\n",
GetGLTargetName(target),
GetGLFormatName(glFormat),
GetGLTypeName(glType));
glGetTexImage(target, 0, glFormat, glType, buffer);
DumpGLBuffer(type, width, height, buffer);
err = glGetError();
if( err != GL_NO_ERROR )
{
log_error( "ERROR: Unable to read data from glGetTexImage : %s : %s : %s : Error %s\n",
GetGLTargetName(target),
GetGLFormatName(glFormat),
GetGLTypeName(glType),
gluErrorString( err ));
return NULL;
}
#endif
if( !allocateMem )
{
free( buffer );
return NULL;
}
#ifndef GL_ES_VERSION_2_0
if( glType == GL_UNSIGNED_INT_8_8_8_8_REV && glFormat == GL_BGRA && allocateMem )
{
// Reverse and reorder to validate since in the
// kernel the read_imagef() call always returns RGBA
cl_uchar *p = (cl_uchar *)buffer;
for( size_t i = 0; i < width * height; i++ )
{
cl_uchar uc0 = p[i * 4 + 0];
cl_uchar uc1 = p[i * 4 + 1];
cl_uchar uc2 = p[i * 4 + 2];
cl_uchar uc3 = p[i * 4 + 3];
p[ i * 4 + 0 ] = uc2;
p[ i * 4 + 1 ] = uc1;
p[ i * 4 + 2 ] = uc0;
p[ i * 4 + 3 ] = uc3;
}
}
#endif
return buffer;
}
void * CreateGLTexture3D( size_t width, size_t height, size_t depth,
GLenum target, GLenum glFormat,
GLenum internalFormat, GLenum glType,
ExplicitType type, GLuint *outTextureID,
int *outError, MTdata d, bool allocateMem)
{
*outError = 0;
char * buffer = (char *)create_random_data( type, d, width * height * depth * 4 );
if( type == kFloat && allocateMem )
{
// Re-fill the created buffer to just have [0-1] floats, since that's what it'd expect
cl_float *p = (cl_float *)buffer;
for( size_t i = 0; i < width * height * depth * 4; i++ )
{
p[ i ] = (float) genrand_real1( d );
}
}
else if( !allocateMem )
memset( buffer, 0, width * height * depth * 4 * get_explicit_type_size( type ) );
glGenTextures( 1, outTextureID );
glBindTexture( target, *outTextureID );
#ifndef GL_ES_VERSION_2_0
glTexEnvi( GL_TEXTURE_ENV, GL_TEXTURE_ENV_MODE, GL_REPLACE );
#endif
glTexParameteri( target, GL_TEXTURE_MIN_FILTER, GL_NEAREST );
glTexParameteri( target, GL_TEXTURE_MAG_FILTER, GL_NEAREST );
glGetError();
glTexImage3D( target, 0, internalFormat, (GLsizei)width, (GLsizei)height, (GLsizei)depth, 0, glFormat, glType, buffer );
GLenum err = glGetError();
if( err != GL_NO_ERROR )
{
/** In section 9.8.3.1. of the CL 1.1. spec it says that:
*
* If a GL texture object with an internal format from table 9.4 is successfully created by
* OpenGL, then there is guaranteed to be a mapping to one of the corresponding CL image
* format(s) in that table.
*
* Notice that some of the formats in table 9.4 are not supported in OpenGL ES 2.0.
*/
log_info( "Warning: Skipping %s : %s : %d : %d : %s : %s : because glTexImage3D returned %s\n",
GetGLTargetName(target),
GetGLFormatName(internalFormat),
(int)(width), (int)(height),
GetGLFormatName(glFormat),
GetGLTypeName(glType),
gluErrorString( err ));
*outError = 0;
delete[] buffer;
return NULL;
}
if( !allocateMem )
{
delete [] buffer;
return NULL;
}
#ifndef GL_ES_VERSION_2_0
if( glType == GL_UNSIGNED_INT_8_8_8_8_REV && glFormat == GL_BGRA && allocateMem )
{
// Reverse and reorder to validate since in the
// kernel the read_imagef() call always returns RGBA
cl_uchar *p = (cl_uchar *)buffer;
for( size_t i = 0; i < width * height * depth; i++ )
{
cl_uchar uc0 = p[i * 4 + 0];
cl_uchar uc1 = p[i * 4 + 1];
cl_uchar uc2 = p[i * 4 + 2];
cl_uchar uc3 = p[i * 4 + 3];
p[ i * 4 + 0 ] = uc2;
p[ i * 4 + 1 ] = uc1;
p[ i * 4 + 2 ] = uc0;
p[ i * 4 + 3 ] = uc3;
}
}
#endif
return buffer;
}
void * ReadGLTexture( GLenum glTarget, GLuint glTexture,
GLenum glFormat, GLenum glInternalFormat,
GLenum glType, ExplicitType typeToReadAs,
size_t outWidth, size_t outHeight )
{
// Read results from the GL texture
glBindTexture(get_base_gl_target(glTarget), glTexture);
GLint realWidth, realHeight;
GLint realInternalFormat;
GLenum readBackFormat = GL_RGBA;
GLenum readBackType = glType;
glFramebufferWrapper glFramebuffer;
glRenderbufferWrapper glRenderbuffer;
size_t outBytes = outWidth * outHeight * 4 * GetGLTypeSize(readBackType);
cl_char *outBuffer = (cl_char *)malloc( outBytes );
GLenum err = 0;
memset(outBuffer, 0, outBytes);
glGenFramebuffersEXT( 1, &glFramebuffer );
glBindFramebufferEXT( GL_FRAMEBUFFER_EXT, glFramebuffer );
glFramebufferTexture2D(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, glTarget, glTexture, 0);
err = glGetError();
if (err != GL_NO_ERROR)
{
log_error("Failed to attach texture to FBO!\n");
return NULL;
}
glReadPixels( 0, 0, (GLsizei)outWidth, (GLsizei)outHeight, readBackFormat, readBackType, outBuffer );
#ifdef GLES_DEBUG
log_info( "- glGetTexImage: %s : %s : %s \n",
GetGLTargetName( glTarget),
GetGLFormatName(readBackFormat),
GetGLTypeName(readBackType));
DumpGLBuffer(readBackType, realWidth, realHeight, (void*)outBuffer);
#endif
return (void *)outBuffer;
}
int CreateGLRenderbufferRaw( GLsizei width, GLsizei height,
GLenum attachment,
GLenum rbFormat, GLenum rbType,
GLuint *outFramebuffer,
GLuint *outRenderbuffer )
{
GLenum err = 0;
// Generate a renderbuffer and bind
glGenRenderbuffersEXT( 1, outRenderbuffer );
glBindRenderbufferEXT( GL_RENDERBUFFER_EXT, *outRenderbuffer );
// Allocate storage to the renderbuffer
glGetError();
glRenderbufferStorageEXT( GL_RENDERBUFFER_EXT, rbFormat, (GLsizei)width, (GLsizei)height );
err = glGetError();
if( err != GL_NO_ERROR )
{
log_error("Failed to allocate render buffer storage!\n");
return 1701;
}
GLint realInternalFormat;
glGetRenderbufferParameterivEXT( GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_INTERNAL_FORMAT_EXT, &realInternalFormat );
rbFormat = realInternalFormat;
#ifdef GLES_DEBUG
GLint rsize, gsize, bsize, asize;
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_RED_SIZE_EXT,&rsize);
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_GREEN_SIZE_EXT,&gsize);
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_BLUE_SIZE_EXT,&bsize);
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_ALPHA_SIZE_EXT,&asize);
log_info("Renderbuffer internal format requested: %s actual: %s sizes: r=%d g=%d b=%d a=%d\n",
GetGLFormatName( internalFormat ), GetGLFormatName( realInternalFormat ),
rsize, gsize, bsize, asize );
#endif
// Create and bind a framebuffer to render with
glGenFramebuffersEXT( 1, outFramebuffer );
glBindFramebufferEXT( GL_FRAMEBUFFER_EXT, *outFramebuffer );
if( err != GL_NO_ERROR )
{
log_error( "ERROR: Unable to bind framebuffer : Error %s\n",
gluErrorString( err ));
return -1;
}
// Attach to the framebuffer
glFramebufferRenderbufferEXT( GL_FRAMEBUFFER_EXT, attachment, GL_RENDERBUFFER_EXT, *outRenderbuffer );
err = glGetError();
GLint status = glCheckFramebufferStatusEXT( GL_FRAMEBUFFER_EXT );
if( status != GL_FRAMEBUFFER_COMPLETE_EXT )
{
log_error( "ERROR: Unable to attach renderbuffer to framebuffer (%s, status %x)\n", gluErrorString( err ), (int)status );
return -1;
}
return 0;
}
static void DrawQuad(void)
{
const char *vssrc =
"varying mediump vec2 texCoord;\n"
"attribute vec2 inPosition;\n"
"void main() {\n"
" texCoord = vec2((inPosition.x+1.0)/2.0, (inPosition.y+1.0)/2.0);\n"
" gl_Position = vec4(inPosition.x, inPosition.y, 0.0, 1.0);\n"
"}\n";
const char *fssrc =
"uniform sampler2D tex;\n"
"varying mediump vec2 texCoord;\n"
"void main() {\n"
" gl_FragColor = texture2D(tex, texCoord);\n"
"}\n";
GLuint vs, fs, program;
GLuint positionIdx = 0;
GLfloat x1 = -1.0f, x2 = 1.0f, y1 = -1.0f, y2 = 1.0f;
GLfloat vertices[4][2];
vertices[0][0] = x1; vertices[0][1] = y1;
vertices[1][0] = x2; vertices[1][1] = y1;
vertices[2][0] = x1; vertices[2][1] = y2;
vertices[3][0] = x2; vertices[3][1] = y2;
vs = glCreateShader(GL_VERTEX_SHADER);
fs = glCreateShader(GL_FRAGMENT_SHADER);
glShaderSource(vs, 1, &vssrc, NULL);
glShaderSource(fs, 1, &fssrc, NULL);
glCompileShader(vs);
glCompileShader(fs);
program = glCreateProgram();
glAttachShader(program, vs);
glAttachShader(program, fs);
glLinkProgram(program);
glUseProgram(program);
positionIdx = glGetAttribLocation(program, "inPosition");
glEnableVertexAttribArray(positionIdx);
glVertexAttribPointer(positionIdx, 2, GL_FLOAT, GL_FALSE, 0, vertices);
glDrawArrays(GL_TRIANGLE_STRIP, 0, 4);
glUseProgram(0);
glDeleteProgram(program);
glDeleteShader(vs);
glDeleteShader(fs);
}
void * CreateGLRenderbuffer( GLsizei width, GLsizei height,
GLenum attachment,
GLenum rbFormat, GLenum rbType,
GLenum texFormat, GLenum texType,
ExplicitType type,
GLuint *outFramebuffer,
GLuint *outRenderbuffer,
int *outError, MTdata d, bool allocateMem )
{
*outError = CreateGLRenderbufferRaw( width, height, attachment, rbFormat, rbType, outFramebuffer, outRenderbuffer );
if( *outError != 0 )
return NULL;
GLenum err = 0;
// Generate a renderbuffer and bind
glGenRenderbuffersEXT( 1, outRenderbuffer );
glBindRenderbufferEXT( GL_RENDERBUFFER_EXT, *outRenderbuffer );
// Allocate storage to the renderbuffer
glGetError();
glRenderbufferStorageEXT( GL_RENDERBUFFER_EXT, rbFormat, (GLsizei)width, (GLsizei)height );
err = glGetError();
if( err != GL_NO_ERROR )
{
*outError = 1701;
log_error("Failed to allocate render buffer storage!\n");
return NULL;
}
GLint realInternalFormat;
glGetRenderbufferParameterivEXT( GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_INTERNAL_FORMAT_EXT, &realInternalFormat );
rbFormat = realInternalFormat;
#ifdef GLES_DEBUG
GLint rsize, gsize, bsize, asize;
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_RED_SIZE_EXT,&rsize);
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_GREEN_SIZE_EXT,&gsize);
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_BLUE_SIZE_EXT,&bsize);
glGetRenderbufferParameterivEXT(GL_RENDERBUFFER_EXT, GL_RENDERBUFFER_ALPHA_SIZE_EXT,&asize);
log_info("Renderbuffer internal format requested: %s actual: %s sizes: r=%d g=%d b=%d a=%d\n",
GetGLFormatName( internalFormat ), GetGLFormatName( realInternalFormat ),
rsize, gsize, bsize, asize );
#endif
// Create and bind a framebuffer to render with
glGenFramebuffersEXT( 1, outFramebuffer );
glBindFramebufferEXT( GL_FRAMEBUFFER_EXT, *outFramebuffer );
err = glGetError();
if( err != GL_NO_ERROR )
{
log_error( "ERROR: Unable to bind framebuffer : Error %s\n",
gluErrorString( err ));
*outError = -1;
return NULL;
}
// Attach to the framebuffer
glFramebufferRenderbufferEXT( GL_FRAMEBUFFER_EXT, attachment, GL_RENDERBUFFER_EXT, *outRenderbuffer );
CHECK_ERROR();
GLint status = glCheckFramebufferStatusEXT( GL_FRAMEBUFFER_EXT );
if( status != GL_FRAMEBUFFER_COMPLETE_EXT )
{
*outError = -1;
log_error( "ERROR: Unable to attach renderbuffer to framebuffer (%s, status %x)\n", gluErrorString( err ), (int)status );
return NULL;
}
void* buffer = CreateRandomData(type, width * height * 4, d);
#ifdef GLES_DEBUG
log_info( "- Fillling renderbuffer: %d : %d : %s : %s \n",
(int)width, (int)height,
GetGLFormatName(glFormat),
GetGLTypeName(glType));
DumpGLBuffer(glType, (int)width, (int)height, (void*)buffer);
#endif
CHECK_ERROR();
// Fill a texture with our input data
glTextureWrapper texture;
glGenTextures( 1, &texture );
glBindTexture( GL_TEXTURE_2D, texture );
CHECK_ERROR();
glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST );
glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_NEAREST );
glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE );
glTexParameteri( GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE );
CHECK_ERROR();
glTexImage2D( GL_TEXTURE_2D, 0, texFormat, width, height, 0, texFormat, texType, buffer );
CHECK_ERROR();
// Render fullscreen textured quad
glViewport(0, 0, width, height);
DrawQuad();
CHECK_ERROR();
// Read back the data in the renderbuffer
memset(buffer, 0, width * height * 4 * get_explicit_type_size( type ));
glReadPixels( 0, 0, (GLsizei)width, (GLsizei)height, texFormat, texType, buffer );
err = glGetError();
if( err != GL_NO_ERROR )
{
log_error( "ERROR: Unable to read data via glReadPixels : %d : %d : %s : %s : Error %s\n",
(int)width, (int)height,
GetGLFormatName(texFormat),
GetGLTypeName(texType),
gluErrorString( err ));
*outError = -1;
}
#ifdef GLES_DEBUG
log_info( "- glReadPixels: %d : %d : %s : %s \n",
(int)width, (int)height,
GetGLFormatName(glFormat),
GetGLTypeName(glType));
DumpGLBuffer(glType, (int)width, (int)height, (void*)buffer);
#endif
if( !allocateMem )
{
free( buffer );
return NULL;
}
#ifndef GL_ES_VERSION_2_0
if( glType == GL_UNSIGNED_INT_8_8_8_8_REV && glFormat == GL_BGRA && allocateMem )
{
// Reverse and reorder to validate since in the
// kernel the read_imagef() call always returns RGBA
cl_uchar *p = (cl_uchar *)buffer;
for( size_t i = 0; i < (size_t)width * height; i++ )
{
cl_uchar uc0 = p[i * 4 + 0];
cl_uchar uc1 = p[i * 4 + 1];
cl_uchar uc2 = p[i * 4 + 2];
cl_uchar uc3 = p[i * 4 + 3];
p[ i * 4 + 0 ] = uc2;
p[ i * 4 + 1 ] = uc1;
p[ i * 4 + 2 ] = uc0;
p[ i * 4 + 3 ] = uc3;
}
}
#endif
return buffer;
}
void * ReadGLRenderbuffer( GLuint glFramebuffer, GLuint glRenderbuffer,
GLenum attachment,
GLenum rbFormat, GLenum rbType,
GLenum texFormat, GLenum texType,
ExplicitType typeToReadAs,
size_t outWidth, size_t outHeight )
{
glBindFramebufferEXT( GL_FRAMEBUFFER_EXT, glFramebuffer );
glFramebufferRenderbufferEXT( GL_FRAMEBUFFER_EXT, attachment, GL_RENDERBUFFER_EXT, glRenderbuffer );
// Attach to the framebuffer
GLint err = glGetError();
if( glCheckFramebufferStatusEXT( GL_FRAMEBUFFER_EXT ) != GL_FRAMEBUFFER_COMPLETE_EXT )
{
log_error( "ERROR: Unable to attach renderbuffer to framebuffer (%s)\n", gluErrorString( err ) );
return NULL;
}
// Read results from the GL renderbuffer
#ifdef GLES_DEBUG
log_info( "- Reading back from GL: %d x %d : %s : %s : %s\n",
(int)outWidth, (int)outHeight,
GetGLFormatName( glInternalFormat ),
GetGLFormatName( glFormat ),
GetGLTypeName( glType ));
#endif
GLenum readBackFormat = GL_RGBA;
GLenum readBackType = texType;
size_t outBytes = outWidth * outHeight * 4 * GetGLTypeSize(readBackType);
void *outBuffer = malloc( outBytes );
memset(outBuffer, 0, outBytes);
glReadPixels( 0, 0, (GLsizei)outWidth, (GLsizei)outHeight, readBackFormat, readBackType, outBuffer );
#ifdef GLES_DEBUG
log_info( "- glReadPixels: %d : %d : %s : %s \n",
(int)outWidth, (int)outHeight,
GetGLFormatName(readBackFormat),
GetGLTypeName(readBackType));
DumpGLBuffer(readBackType, outWidth, outHeight, outBuffer);
#endif
return (void *)outBuffer;
}
GLenum
GetGLFormat(GLenum internalFormat)
{
GLenum glFormat;
switch (internalFormat)
{
case GL_BGRA:
#ifndef GL_ES_VERSION_2_0
case GL_RGBA8:
case GL_RGBA16:
case GL_RGBA32F_ARB:
#endif
glFormat = GL_RGBA;
break;
#ifndef GL_ES_VERSION_2_0
case GL_RGBA8I_EXT:
case GL_RGBA16I_EXT:
case GL_RGBA32I_EXT:
case GL_RGBA8UI_EXT:
case GL_RGBA16UI_EXT:
case GL_RGBA32UI_EXT:
glFormat = GL_RGBA_INTEGER_EXT;
break;
#endif
default:
glFormat = GL_RGBA;
break;
}
return glFormat;
}
GLenum GetGLTypeForExplicitType(ExplicitType type)
{
switch( type )
{
case kFloat:
return GL_FLOAT;
case kInt:
return GL_INT;
case kUInt:
return GL_UNSIGNED_INT;
case kShort:
return GL_SHORT;
case kUShort:
return GL_UNSIGNED_SHORT;
case kChar:
return GL_BYTE;
case kUChar:
return GL_UNSIGNED_BYTE;
case kHalf:
#if defined( __APPLE__ )
return GL_HALF_FLOAT;
#else
return GL_HALF_FLOAT_ARB;
#endif
default:
return GL_INT;
};
}
size_t GetGLTypeSize(GLenum type)
{
switch( type )
{
case GL_FLOAT:
return sizeof(GLfloat);
case GL_INT:
return sizeof(GLint);
case GL_UNSIGNED_INT:
return sizeof(GLuint);
case GL_SHORT:
return sizeof(GLshort);
case GL_UNSIGNED_SHORT:
return sizeof(GLushort);
case GL_BYTE:
return sizeof(GLbyte);
case GL_UNSIGNED_BYTE:
return sizeof(GLubyte);
#if defined( __APPLE__ )
case GL_HALF_FLOAT:
#else
case GL_HALF_FLOAT_ARB:
#endif
return sizeof(GLhalf);
default:
return kFloat;
};
}
ExplicitType GetExplicitTypeForGLType(GLenum type)
{
switch( type )
{
case GL_FLOAT:
return kFloat;
case GL_INT:
return kInt;
case GL_UNSIGNED_INT:
return kUInt;
case GL_SHORT:
return kShort;
case GL_UNSIGNED_SHORT:
return kUShort;
case GL_BYTE:
return kChar;
case GL_UNSIGNED_BYTE:
return kUChar;
#if defined( __APPLE__ )
case GL_HALF_FLOAT:
#else
case GL_HALF_FLOAT_ARB:
#endif
return kHalf;
default:
return kFloat;
};
}
GLenum get_base_gl_target( GLenum target )
{
switch( target )
{
case GL_TEXTURE_CUBE_MAP_POSITIVE_X:
case GL_TEXTURE_CUBE_MAP_POSITIVE_Y:
case GL_TEXTURE_CUBE_MAP_POSITIVE_Z:
case GL_TEXTURE_CUBE_MAP_NEGATIVE_X:
case GL_TEXTURE_CUBE_MAP_NEGATIVE_Y:
case GL_TEXTURE_CUBE_MAP_NEGATIVE_Z:
return GL_TEXTURE_CUBE_MAP;
default:
return target;
}
}
const char *GetGLTypeName( GLenum type )
{
switch( type )
{
case GL_BYTE: return "GL_BYTE";
case GL_UNSIGNED_BYTE: return "GL_UNSIGNED_BYTE";
case GL_INT: return "GL_INT";
case GL_UNSIGNED_INT: return "GL_UNSIGNED_INT";
case GL_SHORT: return "GL_SHORT";
case GL_UNSIGNED_SHORT: return "GL_UNSIGNED_SHORT";
#if defined( __APPLE__ )
case GL_HALF_FLOAT: return "GL_HALF_FLOAT";
#else
case GL_HALF_FLOAT_ARB: return "GL_HALF_FLOAT_ARB";
#endif
case GL_FLOAT: return "GL_FLOAT";
#ifndef GL_ES_VERSION_2_0
case GL_UNSIGNED_INT_8_8_8_8: return "GL_UNSIGNED_INT_8_8_8_8";
case GL_UNSIGNED_INT_8_8_8_8_REV: return "GL_UNSIGNED_INT_8_8_8_8_REV";
#endif
default:
{
static char foo[ 128 ];
sprintf( foo, "(Unknown:0x%08x)", (int)type );
return foo;
}
}
}
const char *GetGLTargetName( GLenum tgt )
{
if( tgt == GL_TEXTURE_2D ) return "GL_TEXTURE_2D";
if( tgt == GL_TEXTURE_3D ) return "GL_TEXTURE_3D";
#ifndef GL_ES_VERSION_2_0
if( tgt == GL_TEXTURE_RECTANGLE_EXT ) return "GL_TEXTURE_RECTANGLE_EXT";
#endif
if( tgt == GL_TEXTURE_CUBE_MAP_POSITIVE_X ) return "GL_TEXTURE_CUBE_MAP_POSITIVE_X";
if( tgt == GL_TEXTURE_CUBE_MAP_POSITIVE_Y ) return "GL_TEXTURE_CUBE_MAP_POSITIVE_Y";
if( tgt == GL_TEXTURE_CUBE_MAP_POSITIVE_Z ) return "GL_TEXTURE_CUBE_MAP_POSITIVE_Z";
if( tgt == GL_TEXTURE_CUBE_MAP_NEGATIVE_X ) return "GL_TEXTURE_CUBE_MAP_NEGATIVE_X";
if( tgt == GL_TEXTURE_CUBE_MAP_NEGATIVE_Y ) return "GL_TEXTURE_CUBE_MAP_NEGATIVE_Y";
if( tgt == GL_TEXTURE_CUBE_MAP_NEGATIVE_Z ) return "GL_TEXTURE_CUBE_MAP_NEGATIVE_Z";
return "";
}
const char *GetGLAttachmentName( GLenum att )
{
if( att == GL_COLOR_ATTACHMENT0_EXT ) return "GL_COLOR_ATTACHMENT0_EXT";
#ifndef GL_ES_VERSION_2_0
if( att == GL_COLOR_ATTACHMENT1_EXT ) return "GL_COLOR_ATTACHMENT1_EXT";
if( att == GL_COLOR_ATTACHMENT2_EXT ) return "GL_COLOR_ATTACHMENT2_EXT";
if( att == GL_COLOR_ATTACHMENT3_EXT ) return "GL_COLOR_ATTACHMENT3_EXT";
if( att == GL_COLOR_ATTACHMENT4_EXT ) return "GL_COLOR_ATTACHMENT4_EXT";
if( att == GL_COLOR_ATTACHMENT5_EXT ) return "GL_COLOR_ATTACHMENT5_EXT";
if( att == GL_COLOR_ATTACHMENT6_EXT ) return "GL_COLOR_ATTACHMENT6_EXT";
if( att == GL_COLOR_ATTACHMENT7_EXT ) return "GL_COLOR_ATTACHMENT7_EXT";
if( att == GL_COLOR_ATTACHMENT8_EXT ) return "GL_COLOR_ATTACHMENT8_EXT";
#endif
if( att == GL_DEPTH_ATTACHMENT_EXT ) return "GL_DEPTH_ATTACHMENT_EXT";
return "";
}
const char *GetGLBaseFormatName( GLenum baseformat )
{
switch( baseformat )
{
case GL_RGBA: return "GL_RGBA";
#ifdef GL_ES_VERSION_2_0
case GL_BGRA_EXT: return "GL_BGRA_EXT";
#else
case GL_RGBA8: return "GL_RGBA";
case GL_RGBA16: return "GL_RGBA";
case GL_BGRA: return "GL_BGRA";
case GL_RGBA8I_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_RGBA16I_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_RGBA32I_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_RGBA8UI_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_RGBA16UI_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_RGBA32UI_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_RGBA32F_ARB: return "GL_RGBA";
case GL_RGBA_INTEGER_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_ALPHA4: return "GL_ALPHA";
case GL_ALPHA8: return "GL_ALPHA";
case GL_ALPHA12: return "GL_ALPHA";
case GL_ALPHA16: return "GL_ALPHA";
case GL_LUMINANCE4: return "GL_LUMINANCE";
case GL_LUMINANCE8: return "GL_LUMINANCE";
case GL_LUMINANCE12: return "GL_LUMINANCE";
case GL_LUMINANCE16: return "GL_LUMINANCE";
case GL_LUMINANCE4_ALPHA4: return "GL_LUMINANCE_ALPHA";
case GL_LUMINANCE6_ALPHA2: return "GL_LUMINANCE_ALPHA";
case GL_LUMINANCE8_ALPHA8: return "GL_LUMINANCE_ALPHA";
case GL_LUMINANCE12_ALPHA4: return "GL_LUMINANCE_ALPHA";
case GL_LUMINANCE12_ALPHA12: return "GL_LUMINANCE_ALPHA";
case GL_LUMINANCE16_ALPHA16: return "GL_LUMINANCE_ALPHA";
case GL_INTENSITY: return "GL_INTENSITY";
case GL_INTENSITY4: return "GL_INTENSITY";
case GL_INTENSITY8: return "GL_INTENSITY";
case GL_INTENSITY12: return "GL_INTENSITY";
case GL_INTENSITY16: return "GL_INTENSITY";
case GL_R3_G3_B2: return "GL_RGB";
case GL_RGB4: return "GL_RGB";
case GL_RGB5: return "GL_RGB";
case GL_RGB8: return "GL_RGB";
case GL_RGB10: return "GL_RGB";
case GL_RGB12: return "GL_RGB";
case GL_RGB16: return "GL_RGB";
case GL_RGBA2: return "GL_RGBA";
case GL_RGBA4: return "GL_RGBA";
case GL_RGB5_A1: return "GL_RGBA";
case GL_RGB10_A2: return "GL_RGBA";
case GL_RGBA12: return "GL_RGBA";
#endif
default:
{
static char foo[ 128 ];
sprintf( foo, "(Unknown:0x%08x)", (int)baseformat );
return foo;
}
}
}
const char *GetGLFormatName( GLenum format )
{
switch( format )
{
case GL_RGBA: return "GL_RGBA";
#ifdef GL_ES_VERSION_2_0
case GL_BGRA_EXT: return "GL_BGRA_EXT";
#else
case GL_RGBA8: return "GL_RGBA8";
case GL_RGBA16: return "GL_RGBA16";
case GL_BGRA: return "GL_BGRA";
case GL_RGBA8I_EXT: return "GL_RGBA8I_EXT";
case GL_RGBA16I_EXT: return "GL_RGBA16I_EXT";
case GL_RGBA32I_EXT: return "GL_RGBA32I_EXT";
case GL_RGBA8UI_EXT: return "GL_RGBA8UI_EXT";
case GL_RGBA16UI_EXT: return "GL_RGBA16UI_EXT";
case GL_RGBA32UI_EXT: return "GL_RGBA32UI_EXT";
case GL_RGBA32F_ARB: return "GL_RGBA32F_ARB";
case GL_RGBA_INTEGER_EXT: return "GL_RGBA_INTEGER_EXT";
case GL_ALPHA4: return "GL_ALPHA4";
case GL_ALPHA8: return "GL_ALPHA8";
case GL_ALPHA12: return "GL_ALPHA12";
case GL_ALPHA16: return "GL_ALPHA16";
case GL_LUMINANCE4: return "GL_LUMINANCE4";
case GL_LUMINANCE8: return "GL_LUMINANCE8";
case GL_LUMINANCE12: return "GL_LUMINANCE12";
case GL_LUMINANCE16: return "GL_LUMINANCE16";
case GL_LUMINANCE4_ALPHA4: return "GL_LUMINANCE4_ALPHA4";
case GL_LUMINANCE6_ALPHA2: return "GL_LUMINANCE6_ALPHA2";
case GL_LUMINANCE8_ALPHA8: return "GL_LUMINANCE8_ALPHA8";
case GL_LUMINANCE12_ALPHA4: return "GL_LUMINANCE12_ALPHA4";
case GL_LUMINANCE12_ALPHA12: return "GL_LUMINANCE12_ALPHA12";
case GL_LUMINANCE16_ALPHA16: return "GL_LUMINANCE16_ALPHA16";
case GL_INTENSITY: return "GL_INTENSITY";
case GL_INTENSITY4: return "GL_INTENSITY4";
case GL_INTENSITY8: return "GL_INTENSITY8";
case GL_INTENSITY12: return "GL_INTENSITY12";
case GL_INTENSITY16: return "GL_INTENSITY16";
case GL_R3_G3_B2: return "GL_R3_G3_B2";
case GL_RGB4: return "GL_RGB4";
case GL_RGB5: return "GL_RGB5";
case GL_RGB8: return "GL_RGB8";
case GL_RGB10: return "GL_RGB10";
case GL_RGB12: return "GL_RGB12";
case GL_RGB16: return "GL_RGB16";
case GL_RGBA2: return "GL_RGBA2";
case GL_RGBA4: return "GL_RGBA4";
case GL_RGB5_A1: return "GL_RGB5_A1";
case GL_RGB10_A2: return "GL_RGB10_A2";
case GL_RGBA12: return "GL_RGBA12";
#endif
case GL_INT: return "GL_INT";
case GL_UNSIGNED_INT: return "GL_UNSIGNED_INT";
case GL_SHORT: return "GL_SHORT";
case GL_UNSIGNED_SHORT: return "GL_UNSIGNED_SHORT";
case GL_BYTE: return "GL_BYTE";
case GL_UNSIGNED_BYTE: return "GL_UNSIGNED_BYTE";
case GL_FLOAT: return "GL_FLOAT";
#ifdef GL_ES_VERSION_2_0
case GL_HALF_FLOAT_OES: return "GL_HALF_FLOAT_OES";
#else
#if defined( __APPLE__ )
case GL_HALF_FLOAT: return "GL_HALF_FLOAT";
#else
case GL_HALF_FLOAT_ARB: return "GL_HALF_FLOAT_ARB";
#endif
#endif
default:
{
static char foo[ 128 ];
sprintf( foo, "(Unknown:0x%08x)", (int)format );
return foo;
}
}
}
void* CreateRandomData( ExplicitType type, size_t count, MTdata d )
{
switch(type)
{
case (kChar):
{
cl_char *p = (cl_char *)malloc(count * sizeof(cl_char));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = (cl_char)genrand_int32(d);
}
return (void*)p;
}
case (kUChar):
{
cl_uchar *p = (cl_uchar *)malloc(count * sizeof(cl_uchar));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = (cl_uchar)genrand_int32(d);
}
return (void*)p;
}
case (kShort):
{
cl_short *p = (cl_short *)malloc(count * sizeof(cl_short));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = (cl_short)genrand_int32(d);
}
return (void*)p;
}
case (kUShort):
{
cl_ushort *p = (cl_ushort *)malloc(count * sizeof(cl_ushort));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = (cl_ushort)genrand_int32(d);
}
return (void*)p;
}
case (kInt):
{
cl_int *p = (cl_int *)malloc(count * sizeof(cl_int));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = (cl_int)genrand_int32(d);
}
return (void*)p;
}
case (kUInt):
{
cl_uint *p = (cl_uint *)malloc(count * sizeof(cl_uint));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = (cl_uint)genrand_int32(d);
}
return (void*)p;
}
case (kFloat):
{
cl_float *p = (cl_float *)malloc(count * sizeof(cl_float));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[ i ] = get_random_float( 0.f, 1.f, d );
}
return (void*)p;
}
/* added support for half floats */
case (kHalf):
{
cl_half *p = (cl_half *)malloc(count * sizeof(cl_half));
if(!p) return 0;
for( size_t i = 0; i < count; i++ )
{
p[i] = cl_half_from_float(get_random_float(0.f, 1.f, d),
CL_HALF_RTE);
}
return (void*)p;
}
default:
{
log_error("Invalid explicit type specified for create random data!\n");
return 0;
}
}
return 0;
}
void DumpGLBuffer(GLenum type, size_t width, size_t height, void* buffer)
{
size_t i;
size_t count = width * height;
if(type == GL_BYTE)
{
cl_char* p = (cl_char*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %3d %3d %3d %3d\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
else if(type == GL_UNSIGNED_BYTE)
{
cl_uchar* p = (cl_uchar*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %3d %3d %3d %3d\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
else if(type == GL_INT)
{
cl_int* p = (cl_int*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %3d %3d %3d %3d\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
else if(type == GL_UNSIGNED_INT)
{
cl_uint* p = (cl_uint*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %3d %3d %3d %3d\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
else if(type == GL_SHORT)
{
cl_short* p = (cl_short*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %3d %3d %3d %3d\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
else if(type == GL_UNSIGNED_SHORT)
{
cl_ushort* p = (cl_ushort*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %3d %3d %3d %3d\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
else if(type == GL_FLOAT)
{
cl_float* p = (cl_float*)buffer;
for(i = 0; i < count; i++)
log_info("[%4d] %#f %#f %#f %#f\n", (unsigned int)(i),
p[i* 4 + 0],
p[i* 4 + 1],
p[i* 4 + 2],
p[i* 4 + 3]);
}
}
#if defined(_WIN32)
#include <string.h>
GLboolean gluCheckExtension(const GLubyte *extName, const GLubyte *extString)
{
const size_t len = strlen((const char*)extName);
const char* str = (const char*)extString;
while (str != NULL) {
str = strstr(str, (const char*)extName);
if (str == NULL) {
break;
}
if ((str > (const char*)extString || str[-1] == ' ')
&& (str[len] == ' ' || str[len] == '\0')) {
return GL_TRUE;
}
str = strchr(str + len, ' ');
}
return GL_FALSE;
}
#endif
// Function pointers for the GL/CL calls
clCreateFromGLBuffer_fn clCreateFromGLBuffer_ptr;
clCreateFromGLTexture_fn clCreateFromGLTexture_ptr;
clCreateFromGLRenderbuffer_fn clCreateFromGLRenderbuffer_ptr;
clGetGLObjectInfo_fn clGetGLObjectInfo_ptr;
clGetGLTextureInfo_fn clGetGLTextureInfo_ptr;
clEnqueueAcquireGLObjects_fn clEnqueueAcquireGLObjects_ptr;
clEnqueueReleaseGLObjects_fn clEnqueueReleaseGLObjects_ptr;
int init_clgl_ext(cl_platform_id platform_id)
{
// Create the function pointer table
clCreateFromGLBuffer_ptr = (clCreateFromGLBuffer_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clCreateFromGLBuffer");
if (clCreateFromGLBuffer_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clCreateFromGLBuffer) returned NULL.\n");
return -1;
}
clCreateFromGLTexture_ptr = (clCreateFromGLTexture_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clCreateFromGLTexture");
if (clCreateFromGLTexture_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clCreateFromGLTexture) returned NULL.\n");
return -1;
}
clCreateFromGLRenderbuffer_ptr = (clCreateFromGLRenderbuffer_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clCreateFromGLRenderbuffer");
if (clCreateFromGLRenderbuffer_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clCreateFromGLRenderbuffer) returned NULL.\n");
return -1;
}
clGetGLObjectInfo_ptr = (clGetGLObjectInfo_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clGetGLObjectInfo");
if (clGetGLObjectInfo_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clGetGLObjectInfo) returned NULL.\n");
return -1;
}
clGetGLTextureInfo_ptr = (clGetGLTextureInfo_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clGetGLTextureInfo");
if (clGetGLTextureInfo_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clGetGLTextureInfo) returned NULL.\n");
return -1;
}
clEnqueueAcquireGLObjects_ptr = (clEnqueueAcquireGLObjects_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clEnqueueAcquireGLObjects");
if (clEnqueueAcquireGLObjects_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clEnqueueAcquireGLObjects) returned NULL.\n");
return -1;
}
clEnqueueReleaseGLObjects_ptr = (clEnqueueReleaseGLObjects_fn)clGetExtensionFunctionAddressForPlatform(platform_id, "clEnqueueReleaseGLObjects");
if (clEnqueueReleaseGLObjects_ptr == NULL)
{
log_error("clGetExtensionFunctionAddressForPlatform(clEnqueueReleaseGLObjects) returned NULL.\n");
return -1;
}
return 0;
}