#include #include #include #include "../src/glsl/glsl_optimizer.h" #define GL_GLEXT_PROTOTYPES 1 #if __linux__ #define GOT_GFX 0 #else #define GOT_GFX 1 #endif #if GOT_GFX // ---- Windows GL bits #ifdef _MSC_VER #define GOT_MORE_THAN_GLSL_120 1 #include #include extern "C" { typedef char GLchar; /* native character */ typedef unsigned int GLuint; /* shader object handle */ #define GL_VERTEX_SHADER 0x8B31 #define GL_FRAGMENT_SHADER 0x8B30 #define GL_COMPILE_STATUS 0x8B81 typedef void (WINAPI * PFNGLDELETESHADERPROC) (GLuint shader); typedef GLuint (WINAPI * PFNGLCREATESHADERPROC) (GLenum type); typedef void (WINAPI * PFNGLSHADERSOURCEPROC) (GLuint shader, GLsizei count, const GLchar *const*string, const GLint *length); typedef void (WINAPI * PFNGLCOMPILESHADERPROC) (GLuint shader); typedef void (WINAPI * PFNGLGETSHADERINFOLOGPROC) (GLuint shader, GLsizei bufSize, GLsizei *length, GLchar *infoLog); typedef void (WINAPI * PFNGLGETSHADERIVPROC) (GLuint shader, GLenum pname, GLint *params); static PFNGLDELETESHADERPROC glDeleteShader; static PFNGLCREATESHADERPROC glCreateShader; static PFNGLSHADERSOURCEPROC glShaderSource; static PFNGLCOMPILESHADERPROC glCompileShader; static PFNGLGETSHADERINFOLOGPROC glGetShaderInfoLog; static PFNGLGETSHADERIVPROC glGetShaderiv; } #endif // #ifdef _MSC_VER // ---- Apple GL bits #ifdef __APPLE__ #define GOT_MORE_THAN_GLSL_120 0 #include #include #include #include #include static CGLContextObj s_GLContext; static CGLContextObj s_GLContext3; static bool s_GL3Active = false; #endif // ifdef __APPLE__ #else // #if GOT_GFX #define GOT_MORE_THAN_GLSL_120 0 #include #include #include "dirent.h" #include "GL/gl.h" #include "GL/glext.h" #endif // ! #if GOT_GFX #ifndef _MSC_VER #include #endif static bool InitializeOpenGL () { bool hasGLSL = false; #if GOT_GFX #ifdef _MSC_VER // setup minimal required GL HWND wnd = CreateWindowA( "STATIC", "GL", WS_OVERLAPPEDWINDOW | WS_CLIPSIBLINGS | WS_CLIPCHILDREN, 0, 0, 16, 16, NULL, NULL, GetModuleHandle(NULL), NULL ); HDC dc = GetDC( wnd ); PIXELFORMATDESCRIPTOR pfd = { sizeof(PIXELFORMATDESCRIPTOR), 1, PFD_DRAW_TO_WINDOW | PFD_SUPPORT_OPENGL, PFD_TYPE_RGBA, 32, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0, 0, PFD_MAIN_PLANE, 0, 0, 0, 0 }; int fmt = ChoosePixelFormat( dc, &pfd ); SetPixelFormat( dc, fmt, &pfd ); HGLRC rc = wglCreateContext( dc ); wglMakeCurrent( dc, rc ); #elif defined(__APPLE__) CGLPixelFormatAttribute attributes[] = { kCGLPFAAccelerated, // no software rendering (CGLPixelFormatAttribute) 0 }; CGLPixelFormatAttribute attributes3[] = { kCGLPFAAccelerated, // no software rendering kCGLPFAOpenGLProfile, // core profile with the version stated below (CGLPixelFormatAttribute) kCGLOGLPVersion_3_2_Core, (CGLPixelFormatAttribute) 0 }; GLint num; CGLPixelFormatObj pix; // create legacy context CGLChoosePixelFormat(attributes, &pix, &num); if (pix == NULL) return false; CGLCreateContext(pix, NULL, &s_GLContext); if (s_GLContext == NULL) return false; CGLDestroyPixelFormat(pix); CGLSetCurrentContext(s_GLContext); // create core 3.2 context CGLChoosePixelFormat(attributes3, &pix, &num); if (pix == NULL) return false; CGLCreateContext(pix, NULL, &s_GLContext3); if (s_GLContext3 == NULL) return false; CGLDestroyPixelFormat(pix); #endif // check if we have GLSL const char* extensions = (const char*)glGetString(GL_EXTENSIONS); hasGLSL = extensions != NULL && strstr(extensions, "GL_ARB_shader_objects") && strstr(extensions, "GL_ARB_vertex_shader") && strstr(extensions, "GL_ARB_fragment_shader"); #if defined(__APPLE__) // using core profile; always has GLSL hasGLSL = true; #endif #ifdef _MSC_VER if (hasGLSL) { glDeleteShader = (PFNGLDELETESHADERPROC)wglGetProcAddress("glDeleteShader"); glCreateShader = (PFNGLCREATESHADERPROC)wglGetProcAddress("glCreateShader"); glShaderSource = (PFNGLSHADERSOURCEPROC)wglGetProcAddress("glShaderSource"); glCompileShader = (PFNGLCOMPILESHADERPROC)wglGetProcAddress("glCompileShader"); glGetShaderInfoLog = (PFNGLGETSHADERINFOLOGPROC)wglGetProcAddress("glGetShaderInfoLog"); glGetShaderiv = (PFNGLGETSHADERIVPROC)wglGetProcAddress("glGetShaderiv"); } #endif #endif return hasGLSL; } static void CleanupGL() { #if GOT_GFX #ifdef __APPLE__ CGLSetCurrentContext(NULL); if (s_GLContext) CGLDestroyContext(s_GLContext); if (s_GLContext3) CGLDestroyContext(s_GLContext3); #endif // #ifdef __APPLE__ #endif // #if GOT_GFX } static bool InitializeMetal () { bool hasMetal = false; #if defined(__APPLE__) hasMetal = true; //@TODO: detect metal compiler presence #endif return hasMetal; } static void replace_string (std::string& target, const std::string& search, const std::string& replace, size_t startPos) { if (search.empty()) return; std::string::size_type p = startPos; while ((p = target.find (search, p)) != std::string::npos) { target.replace (p, search.size (), replace); p += replace.size (); } } static bool CheckGLSL (bool vertex, bool gles, const std::string& testName, const char* prefix, const std::string& source) { #if !GOT_GFX return true; // just assume it's ok #endif #if !GOT_MORE_THAN_GLSL_120 if (source.find("#version 140") != std::string::npos) return true; #endif const bool need3 = (source.find("#version 150") != std::string::npos) || (source.find("#version 300") != std::string::npos); # ifdef __APPLE__ // Mac core context does not accept any older shader versions, so need to switch to // either legacy context or core one. if (need3) { if (!s_GL3Active) CGLSetCurrentContext(s_GLContext3); s_GL3Active = true; } else { if (s_GL3Active) CGLSetCurrentContext(s_GLContext); s_GL3Active = false; } # endif // ifdef __APPLE__ std::string src; if (gles) { src += "#define lowp\n"; src += "#define mediump\n"; src += "#define highp\n"; src += "#define texture2DLodEXT texture2DLod\n"; src += "#define texture2DProjLodEXT texture2DProjLod\n"; src += "#define texture2DGradEXT texture2DGradARB\n"; src += "#define textureCubeGradEXT textureCubeGradARB\n"; src += "#define gl_FragDepthEXT gl_FragDepth\n"; if (!need3) { src += "#define gl_LastFragData _glesLastFragData\n"; src += "varying lowp vec4 _glesLastFragData[4];\n"; } if (!need3) { src += "float shadow2DEXT (sampler2DShadow s, vec3 p) { return shadow2D(s,p).r; }\n"; src += "float shadow2DProjEXT (sampler2DShadow s, vec4 p) { return shadow2DProj(s,p).r; }\n"; } } src += source; if (gles) { replace_string (src, "GL_EXT_shader_texture_lod", "GL_ARB_shader_texture_lod", 0); replace_string (src, "GL_EXT_draw_instanced", "GL_ARB_draw_instanced", 0); replace_string (src, "gl_InstanceIDEXT", "gl_InstanceIDARB ", 0); replace_string (src, "#extension GL_OES_standard_derivatives : require", "", 0); replace_string (src, "#extension GL_EXT_shadow_samplers : require", "", 0); replace_string (src, "#extension GL_EXT_frag_depth : require", "", 0); replace_string (src, "#extension GL_OES_standard_derivatives : enable", "", 0); replace_string (src, "#extension GL_EXT_shadow_samplers : enable", "", 0); replace_string (src, "#extension GL_EXT_frag_depth : enable", "", 0); replace_string (src, "#extension GL_EXT_draw_buffers : enable", "", 0); replace_string (src, "#extension GL_EXT_draw_buffers : require", "", 0); replace_string (src, "precision ", "// precision ", 0); replace_string (src, "#version 300 es", "", 0); } // can't check FB fetch on PC if (src.find("#extension GL_EXT_shader_framebuffer_fetch") != std::string::npos) return true; if (gles && need3) { src = "#version 330\n" + src; } const char* sourcePtr = src.c_str(); GLuint shader = glCreateShader (vertex ? GL_VERTEX_SHADER : GL_FRAGMENT_SHADER); glShaderSource (shader, 1, &sourcePtr, NULL); glCompileShader (shader); GLint status; glGetShaderiv (shader, GL_COMPILE_STATUS, &status); bool res = true; if (status != GL_TRUE) { char log[20000]; log[0] = 0; GLsizei logLength; glGetShaderInfoLog (shader, sizeof(log), &logLength, log); printf ("\n %s: real glsl compiler error on %s:\n%s\n", testName.c_str(), prefix, log); res = false; } glDeleteShader (shader); return res; } static bool CheckMetal (bool vertex, bool gles, const std::string& testName, const char* prefix, const std::string& source) { #if !GOT_GFX || !defined(__APPLE__) return true; // just assume it's ok #else FILE* f = fopen ("metalTemp.metal", "wb"); fwrite (source.c_str(), source.size(), 1, f); fclose (f); #if defined(__ENVIRONMENT_MAC_OS_X_VERSION_MIN_REQUIRED__) int res = system("/Applications/Xcode.app/Contents/Developer/Platforms/iPhoneOS.platform/usr/bin/metal metalTemp.metal -o metalTemp.o -std=ios-metal1.0 -Wno-parentheses-equality"); if (res != 0) { printf ("\n %s: Metal compiler failed\n", testName.c_str()); return false; } #endif // return true; #endif } static bool ReadStringFromFile (const char* pathName, std::string& output) { FILE* file = fopen( pathName, "rb" ); if (file == NULL) return false; fseek(file, 0, SEEK_END); int length = ftell(file); fseek(file, 0, SEEK_SET); if (length < 0) { fclose( file ); return false; } output.resize(length); int readLength = fread(&*output.begin(), 1, length, file); fclose(file); if (readLength != length) { output.clear(); return false; } replace_string(output, "\r\n", "\n", 0); return true; } bool EndsWith (const std::string& str, const std::string& sub) { return (str.size() >= sub.size()) && (strncmp (str.c_str()+str.size()-sub.size(), sub.c_str(), sub.size())==0); } typedef std::vector StringVector; static StringVector GetFiles (const std::string& folder, const std::string& endsWith) { StringVector res; #ifdef _MSC_VER WIN32_FIND_DATAA FindFileData; HANDLE hFind = FindFirstFileA ((folder+"/*"+endsWith).c_str(), &FindFileData); if (hFind == INVALID_HANDLE_VALUE) return res; do { res.push_back (FindFileData.cFileName); } while (FindNextFileA (hFind, &FindFileData)); FindClose (hFind); #else DIR *dirp; struct dirent *dp; if ((dirp = opendir(folder.c_str())) == NULL) return res; while ( (dp = readdir(dirp)) ) { std::string fname = dp->d_name; if (fname == "." || fname == "..") continue; if (!EndsWith (fname, endsWith)) continue; res.push_back (fname); } closedir(dirp); #endif return res; } static void DeleteFile (const std::string& path) { #ifdef _MSC_VER DeleteFileA (path.c_str()); #else unlink (path.c_str()); #endif } static void MassageVertexForGLES (std::string& s) { if (s.find ("_glesVertex") != std::string::npos) return; std::string pre; std::string version = "#version 300 es\n"; size_t insertPoint = s.find(version); if (insertPoint != std::string::npos) { insertPoint += version.size(); pre += "#define gl_Vertex _glesVertex\nin highp vec4 _glesVertex;\n"; pre += "#define gl_Normal _glesNormal\nin mediump vec3 _glesNormal;\n"; pre += "#define gl_MultiTexCoord0 _glesMultiTexCoord0\nin highp vec4 _glesMultiTexCoord0;\n"; pre += "#define gl_MultiTexCoord1 _glesMultiTexCoord1\nin highp vec4 _glesMultiTexCoord1;\n"; pre += "#define gl_Color _glesColor\nin lowp vec4 _glesColor;\n"; } else { insertPoint = 0; pre += "#define gl_Vertex _glesVertex\nattribute highp vec4 _glesVertex;\n"; pre += "#define gl_Normal _glesNormal\nattribute mediump vec3 _glesNormal;\n"; pre += "#define gl_MultiTexCoord0 _glesMultiTexCoord0\nattribute highp vec4 _glesMultiTexCoord0;\n"; pre += "#define gl_MultiTexCoord1 _glesMultiTexCoord1\nattribute highp vec4 _glesMultiTexCoord1;\n"; pre += "#define gl_Color _glesColor\nattribute lowp vec4 _glesColor;\n"; } s.insert (insertPoint, pre); } static void MassageFragmentForGLES (std::string& s) { std::string pre; s = pre + s; } static const char* kGlslTypeNames[kGlslTypeCount] = { "float", "int", "bool", "2d", "3d", "cube", "2dshadow", "2darray", "other", }; static const char* kGlslPrecNames[kGlslPrecCount] = { "high", "medium", "low", }; static bool TestFile (glslopt_ctx* ctx, bool vertex, const std::string& testName, const std::string& inputPath, const std::string& outputPath, bool gles, bool doCheckGLSL, bool doCheckMetal) { std::string input; if (!ReadStringFromFile (inputPath.c_str(), input)) { printf ("\n %s: failed to read input file\n", testName.c_str()); return false; } if (doCheckGLSL) { if (!CheckGLSL (vertex, gles, testName, "input", input.c_str())) return false; } if (gles) { if (vertex) MassageVertexForGLES (input); else MassageFragmentForGLES (input); } bool res = true; glslopt_shader_type type = vertex ? kGlslOptShaderVertex : kGlslOptShaderFragment; glslopt_shader* shader = glslopt_optimize (ctx, type, input.c_str(), 0); bool optimizeOk = glslopt_get_status(shader); if (optimizeOk) { std::string textHir = glslopt_get_raw_output (shader); std::string textOpt = glslopt_get_output (shader); // append stats char buffer[1000]; int statsAlu, statsTex, statsFlow; glslopt_shader_get_stats (shader, &statsAlu, &statsTex, &statsFlow); sprintf(buffer, "\n// stats: %i alu %i tex %i flow\n", statsAlu, statsTex, statsFlow); textOpt += buffer; // append inputs const int inputCount = glslopt_shader_get_input_count (shader); if (inputCount > 0) { sprintf(buffer, "// inputs: %i\n", inputCount); textOpt += buffer; } for (int i = 0; i < inputCount; ++i) { const char* parName; glslopt_basic_type parType; glslopt_precision parPrec; int parVecSize, parMatSize, parArrSize, location; glslopt_shader_get_input_desc(shader, i, &parName, &parType, &parPrec, &parVecSize, &parMatSize, &parArrSize, &location); if (location >= 0) sprintf(buffer, "// #%i: %s (%s %s) %ix%i [%i] loc %i\n", i, parName, kGlslPrecNames[parPrec], kGlslTypeNames[parType], parVecSize, parMatSize, parArrSize, location); else sprintf(buffer, "// #%i: %s (%s %s) %ix%i [%i]\n", i, parName, kGlslPrecNames[parPrec], kGlslTypeNames[parType], parVecSize, parMatSize, parArrSize); textOpt += buffer; } // append uniforms const int uniformCount = glslopt_shader_get_uniform_count (shader); const int uniformSize = glslopt_shader_get_uniform_total_size (shader); if (uniformCount > 0) { sprintf(buffer, "// uniforms: %i (total size: %i)\n", uniformCount, uniformSize); textOpt += buffer; } for (int i = 0; i < uniformCount; ++i) { const char* parName; glslopt_basic_type parType; glslopt_precision parPrec; int parVecSize, parMatSize, parArrSize, location; glslopt_shader_get_uniform_desc(shader, i, &parName, &parType, &parPrec, &parVecSize, &parMatSize, &parArrSize, &location); if (location >= 0) sprintf(buffer, "// #%i: %s (%s %s) %ix%i [%i] loc %i\n", i, parName, kGlslPrecNames[parPrec], kGlslTypeNames[parType], parVecSize, parMatSize, parArrSize, location); else sprintf(buffer, "// #%i: %s (%s %s) %ix%i [%i]\n", i, parName, kGlslPrecNames[parPrec], kGlslTypeNames[parType], parVecSize, parMatSize, parArrSize); textOpt += buffer; } // append textures const int textureCount = glslopt_shader_get_texture_count (shader); if (textureCount > 0) { sprintf(buffer, "// textures: %i\n", textureCount); textOpt += buffer; } for (int i = 0; i < textureCount; ++i) { const char* parName; glslopt_basic_type parType; glslopt_precision parPrec; int parVecSize, parMatSize, parArrSize, location; glslopt_shader_get_texture_desc(shader, i, &parName, &parType, &parPrec, &parVecSize, &parMatSize, &parArrSize, &location); if (location >= 0) sprintf(buffer, "// #%i: %s (%s %s) %ix%i [%i] loc %i\n", i, parName, kGlslPrecNames[parPrec], kGlslTypeNames[parType], parVecSize, parMatSize, parArrSize, location); else sprintf(buffer, "// #%i: %s (%s %s) %ix%i [%i]\n", i, parName, kGlslPrecNames[parPrec], kGlslTypeNames[parType], parVecSize, parMatSize, parArrSize); textOpt += buffer; } std::string outputOpt; ReadStringFromFile (outputPath.c_str(), outputOpt); if (res && doCheckMetal && !CheckMetal (vertex, gles, testName, "metal", textOpt.c_str())) res = false; if (textOpt != outputOpt) { // write output FILE* f = fopen (outputPath.c_str(), "wb"); if (!f) { printf ("\n %s: can't write to optimized file!\n", testName.c_str()); } else { fwrite (textOpt.c_str(), 1, textOpt.size(), f); fclose (f); } printf ("\n %s: does not match optimized output\n", testName.c_str()); res = false; } if (res && doCheckGLSL && !CheckGLSL (vertex, gles, testName, "raw", textHir.c_str())) res = false; if (res && doCheckGLSL && !CheckGLSL (vertex, gles, testName, "optimized", textOpt.c_str())) res = false; } else { printf ("\n %s: optimize error: %s\n", testName.c_str(), glslopt_get_log(shader)); res = false; } glslopt_shader_delete (shader); return res; } int main (int argc, const char** argv) { if (argc < 2) { printf ("USAGE: glsloptimizer testfolder\n"); return 1; } bool hasOpenGL = InitializeOpenGL (); bool hasMetal = InitializeMetal (); glslopt_ctx* ctx[3] = { glslopt_initialize(kGlslTargetOpenGLES20), glslopt_initialize(kGlslTargetOpenGLES30), glslopt_initialize(kGlslTargetOpenGL), }; glslopt_ctx* ctxMetal = glslopt_initialize(kGlslTargetMetal); std::string baseFolder = argv[1]; clock_t time0 = clock(); // 2.39s // ralloc fix 256 initial: 1.35s static const char* kTypeName[2] = { "vertex", "fragment" }; size_t tests = 0; size_t errors = 0; for (int type = 0; type < 2; ++type) { std::string testFolder = baseFolder + "/" + kTypeName[type]; static const char* kAPIName[3] = { "OpenGL ES 2.0", "OpenGL ES 3.0", "OpenGL" }; static const char* kApiIn [3] = {"-inES.txt", "-inES3.txt", "-in.txt"}; static const char* kApiOut[3] = {"-outES.txt", "-outES3.txt", "-out.txt"}; static const char* kApiOutMetal[3] = {"-outESMetal.txt", "-outES3Metal.txt", "-outMetal.txt"}; for (int api = 0; api < 3; ++api) { printf ("\n** running %s tests for %s...\n", kTypeName[type], kAPIName[api]); StringVector inputFiles = GetFiles (testFolder, kApiIn[api]); size_t n = inputFiles.size(); for (size_t i = 0; i < n; ++i) { std::string inname = inputFiles[i]; //if (inname != "ast-in.txt") // continue; std::string outname = inname.substr (0,inname.size()-strlen(kApiIn[api])) + kApiOut[api]; std::string outnameMetal = inname.substr (0,inname.size()-strlen(kApiIn[api])) + kApiOutMetal[api]; const bool useMetal = (api == 1); bool ok = TestFile (ctx[api], type==0, inname, testFolder + "/" + inname, testFolder + "/" + outname, api<=1, hasOpenGL, false); if (!ok) { ++errors; } if (useMetal) { ok = TestFile (ctxMetal, type==0, inname, testFolder + "/" + inname, testFolder + "/" + outnameMetal, api==0, false, hasMetal); if (!ok) { ++errors; } } ++tests; } } } clock_t time1 = clock(); float timeDelta = float(time1-time0)/CLOCKS_PER_SEC; if (errors != 0) printf ("\n**** %i tests (%.2fsec), %i !!!FAILED!!!\n", (int)tests, timeDelta, (int)errors); else printf ("\n**** %i tests (%.2fsec) succeeded\n", (int)tests, timeDelta); // 3.25s // with builtin call linking, 3.84s for (int i = 0; i < 2; ++i) glslopt_cleanup (ctx[i]); glslopt_cleanup (ctxMetal); CleanupGL(); return errors ? 1 : 0; }