// // Copyright (c) 2017 The Khronos Group Inc. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // #include "../../test_common/harness/compat.h" #include #include #include #if ! defined( _WIN32) #if ! defined( __ANDROID__ ) #include #endif #include #define streamDup(fd1) dup(fd1) #define streamDup2(fd1,fd2) dup2(fd1,fd2) #endif #include #include "test_printf.h" #if defined(_WIN32) #include #define streamDup(fd1) _dup(fd1) #define streamDup2(fd1,fd2) _dup2(fd1,fd2) #endif #include "../../test_common/harness/testHarness.h" #include "../../test_common/harness/errorHelpers.h" #include "../../test_common/harness/kernelHelpers.h" #include "../../test_common/harness/mt19937.h" typedef unsigned int uint32_t; //----------------------------------------- // Static helper functions declaration //----------------------------------------- static void printUsage( void ); //Stream helper functions //Associate stdout stream with the file(/tmp/tmpfile):i.e redirect stdout stream to the specific files (/tmp/tmpfile) static int acquireOutputStream(); //Close the file(/tmp/tmpfile) associated with the stdout stream and disassociates it. static void releaseOutputStream(int fd); //Get analysis buffer to verify the correctess of printed data static void getAnalysisBuffer(char* analysisBuffer); //Kernel builder helper functions //Check if the test case is for kernel that has argument static int isKernelArgument(testCase* pTestCase,size_t testId); //Check if the test case treats %p format for void* static int isKernelPFormat(testCase* pTestCase,size_t testId); //----------------------------------------- // Static functions declarations //----------------------------------------- // Make a program that uses printf for the given type/format, static cl_program makePrintfProgram(cl_kernel *kernel_ptr, const cl_context context,const unsigned int testId,const unsigned int testNum,bool isLongSupport = true,bool is64bAddrSpace = false); // Creates and execute the printf test for the given device, context, type/format static int doTest(cl_command_queue queue, cl_context context, const unsigned int testId, const unsigned int testNum, cl_device_id device); // Check if device supports long static bool isLongSupported(cl_device_id device_id); // Check if device address space is 64 bits static bool is64bAddressSpace(cl_device_id device_id); //Wait until event status is CL_COMPLETE int waitForEvent(cl_event* event); //----------------------------------------- // Definitions and initializations //----------------------------------------- // Tests are broken into the major test which is based on the // src and cmp type and their corresponding vector types and // sub tests which is for each individual test. The following // tracks the subtests int s_test_cnt = 0; int s_test_fail = 0; static cl_device_id gDevice; static cl_context gContext; static cl_command_queue gQueue; static int gFd; //----------------------------------------- // Static helper functions definition //----------------------------------------- //----------------------------------------- // acquireOutputStream //----------------------------------------- static int acquireOutputStream() { int fd = streamDup(fileno(stdout)); #if (defined(__linux__) || defined(__APPLE__)) && (!defined( __ANDROID__ )) freopen("/tmp/tmpfile","w",stdout); #else freopen("tmpfile","w",stdout); #endif return fd; } //----------------------------------------- // releaseOutputStream //----------------------------------------- static void releaseOutputStream(int fd) { fflush(stdout); streamDup2(fd,fileno(stdout)); close(fd); } //----------------------------------------- // getAnalysisBuffer //----------------------------------------- static void getAnalysisBuffer(char* analysisBuffer) { FILE *fp; memset(analysisBuffer,0,ANALYSIS_BUFFER_SIZE); #if (defined(__linux__) || defined(__APPLE__)) && (!defined( __ANDROID__ )) fp = fopen("/tmp/tmpfile","r"); #else fp = fopen("tmpfile","r"); #endif if(NULL == fp) log_error("Failed to open analysis buffer ('%s')\n", strerror(errno)); else while(fgets(analysisBuffer,ANALYSIS_BUFFER_SIZE , fp) != NULL ); fclose(fp); } //----------------------------------------- // isKernelArgument //----------------------------------------- static int isKernelArgument(testCase* pTestCase,size_t testId) { return strcmp(pTestCase->_genParameters[testId].addrSpaceArgumentTypeQualifier,""); } //----------------------------------------- // isKernelPFormat //----------------------------------------- static int isKernelPFormat(testCase* pTestCase,size_t testId) { return strcmp(pTestCase->_genParameters[testId].addrSpacePAdd,""); } //----------------------------------------- // waitForEvent //----------------------------------------- int waitForEvent(cl_event* event) { cl_int status = CL_SUCCESS; cl_int eventStatus = CL_QUEUED; while(eventStatus != CL_COMPLETE) { status = clGetEventInfo( *event, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &eventStatus, NULL); if(status != CL_SUCCESS) { log_error("clGetEventInfo failed"); return status; } } status = clReleaseEvent(*event); if(status != CL_SUCCESS) { log_error("clReleaseEvent failed. (*event)"); return status; } return CL_SUCCESS; } //----------------------------------------- // Static helper functions definition //----------------------------------------- //----------------------------------------- // makePrintfProgram //----------------------------------------- static cl_program makePrintfProgram(cl_kernel *kernel_ptr, const cl_context context,const unsigned int testId,const unsigned int testNum,bool isLongSupport,bool is64bAddrSpace) { int err,i; cl_program program; cl_device_id devID; char buildLog[ 1024 * 128 ]; char testname[256] = {0}; char addrSpaceArgument[256] = {0}; char addrSpacePAddArgument[256] = {0}; //Program Source code for int,float,octal,hexadecimal,char,string const char *sourceGen[] = { "__kernel void ", testname, "(void)\n", "{\n" " printf(\"", allTestCase[testId]->_genParameters[testNum].genericFormat, "\\n\",", allTestCase[testId]->_genParameters[testNum].dataRepresentation, ");", "}\n" }; //Program Source code for vector const char *sourceVec[] = { "__kernel void ", testname, "(void)\n", "{\n", allTestCase[testId]->_genParameters[testNum].dataType, allTestCase[testId]->_genParameters[testNum].vectorSize, " tmp = (", allTestCase[testId]->_genParameters[testNum].dataType, allTestCase[testId]->_genParameters[testNum].vectorSize, ")", allTestCase[testId]->_genParameters[testNum].dataRepresentation, ";", " printf(\"", allTestCase[testId]->_genParameters[testNum].vectorFormatFlag, "v", allTestCase[testId]->_genParameters[testNum].vectorSize, allTestCase[testId]->_genParameters[testNum].vectorFormatSpecifier, "\\n\",", "tmp);", "}\n" }; //Program Source code for address space const char *sourceAddrSpace[] = { "__kernel void ", testname,"(",addrSpaceArgument, ")\n{\n", allTestCase[testId]->_genParameters[testNum].addrSpaceVariableTypeQualifier, "printf(", allTestCase[testId]->_genParameters[testNum].genericFormat, ",", allTestCase[testId]->_genParameters[testNum].addrSpaceParameter, "); ", addrSpacePAddArgument, "\n}\n" }; //Update testname sprintf(testname,"%s%d","test",testId); //Update addrSpaceArgument and addrSpacePAddArgument types, based on FULL_PROFILE/EMBEDDED_PROFILE if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE) { sprintf(addrSpaceArgument, "%s",allTestCase[testId]->_genParameters[testNum].addrSpaceArgumentTypeQualifier); sprintf(addrSpacePAddArgument,allTestCase[testId]->_genParameters[testNum].addrSpacePAdd); } if (strlen(addrSpaceArgument) == 0) sprintf(addrSpaceArgument,"void"); // create program based on its type if(allTestCase[testId]->_type == TYPE_VECTOR) { program = clCreateProgramWithSource( context,sizeof(sourceVec)/sizeof(sourceVec[0]),sourceVec, NULL, NULL); } else if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE) { program = clCreateProgramWithSource( context,sizeof(sourceAddrSpace)/sizeof(sourceAddrSpace[0]),sourceAddrSpace, NULL, NULL); } else { program = clCreateProgramWithSource( context,sizeof(sourceGen)/sizeof(sourceGen[0]),sourceGen, NULL, NULL); } if (!program) { log_error("clCreateProgramWithSource failed\n"); return NULL; } err = clBuildProgram(program, 0, NULL, NULL, NULL, NULL); if (err != CL_SUCCESS) { log_error("clBuildProgramExecutable failed errcode:%d\n", err); err = clGetProgramInfo( program, CL_PROGRAM_DEVICES, sizeof( devID ), &devID, NULL ); if (err){ log_error("Unable to get program's device: %d\n",err ); return NULL; } err = clGetProgramBuildInfo( program, devID, CL_PROGRAM_BUILD_LOG, sizeof( buildLog ), buildLog, NULL ); if (err){ log_error("Unable to get program's build log: %d\n",err ); return NULL; } size_t sourceLen; const char** source; if(allTestCase[testId]->_type == TYPE_VECTOR) { sourceLen = sizeof(sourceVec) / sizeof( sourceVec[0] ); source = sourceVec; } else if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE) { sourceLen = sizeof(sourceAddrSpace) / sizeof( sourceAddrSpace[0] ); source = sourceAddrSpace; } else { sourceLen = sizeof(sourceGen) / sizeof( sourceGen[0] ); source = sourceGen; } log_error( "Build log is: ------------\n" ); log_error( "%s\n", buildLog ); log_error( "----------\n" ); log_error( " Source is ----------------\n"); for(i = 0; i < sourceLen; ++i) { log_error("%s", source[i]); } log_error( "----------\n" ); return NULL; } *kernel_ptr = clCreateKernel(program, testname, &err); if ( err ) { log_error("clCreateKernel failed (%d)\n", err); return NULL; } return program; } //----------------------------------------- // isLongSupported //----------------------------------------- static bool isLongSupported(cl_device_id device_id) { size_t tempSize = 0; cl_int status; bool extSupport = true; // Device profile status = clGetDeviceInfo( device_id, CL_DEVICE_PROFILE, 0, NULL, &tempSize); if(status != CL_SUCCESS) { log_error("*** clGetDeviceInfo FAILED ***\n\n"); return false; } std::unique_ptr profileType(new char[tempSize]); if(profileType == NULL) { log_error("Failed to allocate memory(profileType)"); return false; } status = clGetDeviceInfo( device_id, CL_DEVICE_PROFILE, sizeof(char) * tempSize, profileType.get(), NULL); if(!strcmp("EMBEDDED_PROFILE",profileType.get())) { // Device extention status = clGetDeviceInfo( device_id, CL_DEVICE_EXTENSIONS, 0, NULL, &tempSize); if(status != CL_SUCCESS) { log_error("*** clGetDeviceInfo FAILED ***\n\n"); return false; } std::unique_ptr devExt(new char[tempSize]); if(devExt == NULL) { log_error("Failed to allocate memory(devExt)"); return false; } status = clGetDeviceInfo( device_id, CL_DEVICE_EXTENSIONS, sizeof(char) * tempSize, devExt.get(), NULL); extSupport = (strstr(devExt.get(),"cles_khr_int64") != NULL); } return extSupport; } //----------------------------------------- // is64bAddressSpace //----------------------------------------- static bool is64bAddressSpace(cl_device_id device_id) { cl_int status; cl_uint addrSpaceB; // Device profile status = clGetDeviceInfo( device_id, CL_DEVICE_ADDRESS_BITS, sizeof(cl_uint), &addrSpaceB, NULL); if(status != CL_SUCCESS) { log_error("*** clGetDeviceInfo FAILED ***\n\n"); return false; } if(addrSpaceB == 64) return true; else return false; } //----------------------------------------- // doTest //----------------------------------------- static int doTest(cl_command_queue queue, cl_context context, const unsigned int testId, const unsigned int testNum, cl_device_id device) { if(allTestCase[testId]->_type == TYPE_VECTOR) { log_info("%d)testing printf(\"%sv%s%s\",%s)\n",testNum,allTestCase[testId]->_genParameters[testNum].vectorFormatFlag,allTestCase[testId]->_genParameters[testNum].vectorSize, allTestCase[testId]->_genParameters[testNum].vectorFormatSpecifier,allTestCase[testId]->_genParameters[testNum].dataRepresentation); } else if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE) { if(isKernelArgument(allTestCase[testId], testNum)) { log_info("%d)testing kernel //argument %s \n printf(%s,%s)\n",testNum,allTestCase[testId]->_genParameters[testNum].addrSpaceArgumentTypeQualifier, allTestCase[testId]->_genParameters[testNum].genericFormat,allTestCase[testId]->_genParameters[testNum].addrSpaceParameter); } else { log_info("%d)testing kernel //variable %s \n printf(%s,%s)\n",testNum,allTestCase[testId]->_genParameters[testNum].addrSpaceVariableTypeQualifier, allTestCase[testId]->_genParameters[testNum].genericFormat,allTestCase[testId]->_genParameters[testNum].addrSpaceParameter); } } else { log_info("%d)testing printf(\"%s\",%s)\n",testNum,allTestCase[testId]->_genParameters[testNum].genericFormat,allTestCase[testId]->_genParameters[testNum].dataRepresentation); } // Long support for varible type if(allTestCase[testId]->_type == TYPE_VECTOR && !strcmp(allTestCase[testId]->_genParameters[testNum].dataType,"long") && !isLongSupported(device)) { log_info( "Long is not supported, test not run.\n" ); return 0; } // Long support for address in FULL_PROFILE/EMBEDDED_PROFILE bool isLongSupport = true; if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE && isKernelPFormat(allTestCase[testId],testNum) && !isLongSupported(device)) { isLongSupport = false; } gFd = acquireOutputStream(); int err; cl_program program; cl_kernel kernel; cl_mem d_out = NULL; cl_mem d_a = NULL; char _analysisBuffer[ANALYSIS_BUFFER_SIZE]; cl_uint out32 = 0; cl_ulong out64 = 0; // Define an index space (global work size) of threads for execution. size_t globalWorkSize[1]; program = makePrintfProgram(&kernel, context,testId,testNum,isLongSupport,is64bAddressSpace(device)); if (!program || !kernel) { ++s_test_fail; ++s_test_cnt; releaseOutputStream(gFd); return -1; } //For address space test if there is kernel argument - set it if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE ) { if(isKernelArgument(allTestCase[testId],testNum)) { int a = 2; d_a = clCreateBuffer(context, CL_MEM_READ_ONLY|CL_MEM_COPY_HOST_PTR, sizeof(int), &a, &err); if(err!= CL_SUCCESS || d_a == NULL) { log_error("clCreateBuffer failed\n"); goto exit; } err = clSetKernelArg(kernel, 0, sizeof(cl_mem), &d_a); if(err!= CL_SUCCESS) { log_error("clSetKernelArg failed\n"); goto exit; } } //For address space test if %p is tested if(isKernelPFormat(allTestCase[testId],testNum)) { d_out = clCreateBuffer(context, CL_MEM_READ_WRITE, sizeof(cl_ulong), NULL, &err); if(err!= CL_SUCCESS || d_out == NULL) { log_error("clCreateBuffer failed\n"); goto exit; } err = clSetKernelArg(kernel, 1, sizeof(cl_mem), &d_out); if(err!= CL_SUCCESS) { log_error("clSetKernelArg failed\n"); goto exit; } } } globalWorkSize[0] = 1; cl_event ndrEvt; err = clEnqueueNDRangeKernel(queue, kernel, 1, NULL, globalWorkSize, NULL, 0, NULL,&ndrEvt); if (err != CL_SUCCESS) { log_error("\n clEnqueueNDRangeKernel failed errcode:%d\n", err); ++s_test_fail; goto exit; } fflush(stdout); err = clFlush(queue); if(err != CL_SUCCESS) { log_error("clFlush failed\n"); goto exit; } //Wait until kernel finishes its execution and (thus) the output printed from the kernel //is immidatly printed err = waitForEvent(&ndrEvt); if(err != CL_SUCCESS) { log_error("waitforEvent failed\n"); goto exit; } fflush(stdout); if(allTestCase[testId]->_type == TYPE_ADDRESS_SPACE && isKernelPFormat(allTestCase[testId],testNum)) { // Read the OpenCL output buffer (d_out) to the host output array (out) if(!is64bAddressSpace(device))//32-bit address space { clEnqueueReadBuffer(queue, d_out, CL_TRUE, 0, sizeof(cl_int),&out32, 0, NULL, NULL); } else //64-bit address space { clEnqueueReadBuffer(queue, d_out, CL_TRUE, 0, sizeof(cl_ulong),&out64, 0, NULL, NULL); } } // //Get the output printed from the kernel to _analysisBuffer //and verify its correctness getAnalysisBuffer(_analysisBuffer); if(!is64bAddressSpace(device)) //32-bit address space { if(0 != verifyOutputBuffer(_analysisBuffer,allTestCase[testId],testNum,(cl_ulong) out32)) err = ++s_test_fail; } else //64-bit address space { if(0 != verifyOutputBuffer(_analysisBuffer,allTestCase[testId],testNum,out64)) err = ++s_test_fail; } exit: if(clReleaseKernel(kernel) != CL_SUCCESS) log_error("clReleaseKernel failed\n"); if(clReleaseProgram(program) != CL_SUCCESS) log_error("clReleaseProgram failed\n"); if(d_out) clReleaseMemObject(d_out); if(d_a) clReleaseMemObject(d_a); ++s_test_cnt; releaseOutputStream(gFd); return err; } //----------------------------------------- // printArch //----------------------------------------- static void printArch( void ) { log_info( "sizeof( void*) = %d\n", (int) sizeof( void *) ); #if defined( __APPLE__ ) #if defined( __ppc__ ) log_info( "ARCH:\tppc\n" ); #elif defined( __ppc64__ ) log_info( "ARCH:\tppc64\n" ); #elif defined( __i386__ ) log_info( "ARCH:\ti386\n" ); #elif defined( __x86_64__ ) log_info( "ARCH:\tx86_64\n" ); #elif defined( __arm__ ) log_info( "ARCH:\tarm\n" ); #elif defined( __aarch64__ ) log_info( "ARCH:\taarch64\n" ); #else #error unknown arch #endif int type = 0; size_t typeSize = sizeof( type ); sysctlbyname( "hw.cputype", &type, &typeSize, NULL, 0 ); log_info( "cpu type:\t%d\n", type ); typeSize = sizeof( type ); sysctlbyname( "hw.cpusubtype", &type, &typeSize, NULL, 0 ); log_info( "cpu subtype:\t%d\n", type ); #endif } int test_int_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 0, gDevice); } int test_int_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 1, gDevice); } int test_int_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 2, gDevice); } int test_int_3(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 3, gDevice); } int test_int_4(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 4, gDevice); } int test_int_5(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 5, gDevice); } int test_int_6(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 6, gDevice); } int test_int_7(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 7, gDevice); } int test_int_8(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_INT, 8, gDevice); } int test_float_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 0, gDevice); } int test_float_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 1, gDevice); } int test_float_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 2, gDevice); } int test_float_3(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 3, gDevice); } int test_float_4(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 4, gDevice); } int test_float_5(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 5, gDevice); } int test_float_6(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 6, gDevice); } int test_float_7(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 7, gDevice); } int test_float_8(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 8, gDevice); } int test_float_9(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 9, gDevice); } int test_float_10(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 10, gDevice); } int test_float_11(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 11, gDevice); } int test_float_12(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 12, gDevice); } int test_float_13(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 13, gDevice); } int test_float_14(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 14, gDevice); } int test_float_15(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 15, gDevice); } int test_float_16(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 16, gDevice); } int test_float_17(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 17, gDevice); } int test_float_18(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 18, gDevice); } int test_float_19(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 19, gDevice); } int test_float_20(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_FLOAT, 20, gDevice); } int test_octal_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_OCTAL, 0, gDevice); } int test_octal_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_OCTAL, 1, gDevice); } int test_octal_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_OCTAL, 2, gDevice); } int test_octal_3(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_OCTAL, 3, gDevice); } int test_unsigned_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_UNSIGNED, 0, gDevice); } int test_unsigned_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_UNSIGNED, 1, gDevice); } int test_hexadecimal_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_HEXADEC, 0, gDevice); } int test_hexadecimal_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_HEXADEC, 1, gDevice); } int test_hexadecimal_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_HEXADEC, 2, gDevice); } int test_hexadecimal_3(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_HEXADEC, 3, gDevice); } int test_hexadecimal_4(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_HEXADEC, 4, gDevice); } int test_char_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_CHAR, 0, gDevice); } int test_char_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_CHAR, 1, gDevice); } int test_char_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_CHAR, 2, gDevice); } int test_string_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_STRING, 0, gDevice); } int test_string_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_STRING, 1, gDevice); } int test_string_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_STRING, 2, gDevice); } int test_vector_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_VECTOR, 0, gDevice); } int test_vector_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_VECTOR, 1, gDevice); } int test_vector_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_VECTOR, 2, gDevice); } int test_vector_3(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_VECTOR, 3, gDevice); } int test_vector_4(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_VECTOR, 4, gDevice); } int test_address_space_0(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_ADDRESS_SPACE, 0, gDevice); } int test_address_space_1(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_ADDRESS_SPACE, 1, gDevice); } int test_address_space_2(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_ADDRESS_SPACE, 2, gDevice); } int test_address_space_3(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_ADDRESS_SPACE, 3, gDevice); } int test_address_space_4(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { return doTest(gQueue, gContext, TYPE_ADDRESS_SPACE, 4, gDevice); } basefn basefn_list[] = { test_int_0, test_int_1, test_int_2, test_int_3, test_int_4, test_int_5, test_int_6, test_int_7, test_int_8, test_float_0, test_float_1, test_float_2, test_float_3, test_float_4, test_float_5, test_float_6, test_float_7, test_float_8, test_float_9, test_float_10, test_float_11, test_float_12, test_float_13, test_float_14, test_float_15, test_float_16, test_float_17, test_float_18, test_float_19, test_float_20, test_octal_0, test_octal_1, test_octal_2, test_octal_3, test_unsigned_0, test_unsigned_1, test_hexadecimal_0, test_hexadecimal_1, test_hexadecimal_2, test_hexadecimal_3, test_hexadecimal_4, test_char_0, test_char_1, test_char_2, test_string_0, test_string_1, test_string_2, test_vector_0, test_vector_1, test_vector_2, test_vector_3, test_vector_4, test_address_space_0, test_address_space_1, test_address_space_2, test_address_space_3, test_address_space_4, }; const char *basefn_names[] = { "int_0", "int_1", "int_2", "int_3", "int_4", "int_5", "int_6", "int_7", "int_8", "float_0", "float_1", "float_2", "float_3", "float_4", "float_5", "float_6", "float_7", "float_8", "float_9", "float_10", "float_11", "float_12", "float_13", "float_14", "float_15", "float_16", "float_17", "float_18", "float_19", "float_20", "octal_0", "octal_1", "octal_2", "octal_3", "unsigned_0", "unsigned_1", "hexadecimal_0", "hexadecimal_1", "hexadecimal_2", "hexadecimal_3", "hexadecimal_4", "char_0", "char_1", "char_2", "string_0", "string_1", "string_2", "vector_0", "vector_1", "vector_2", "vector_3", "vector_4", "address_space_0", "address_space_1", "address_space_2", "address_space_3", "address_space_4", }; ct_assert((sizeof(basefn_names) / sizeof(basefn_names[0])) == (sizeof(basefn_list) / sizeof(basefn_list[0]))); int num_fns = sizeof(basefn_names) / sizeof(char *); //----------------------------------------- // main //----------------------------------------- int main(int argc, char* argv[]) { int i; cl_device_type device_type = CL_DEVICE_TYPE_DEFAULT; cl_platform_id platform_id; uint32_t device_frequency = 0; uint32_t compute_devices = 0; test_start(); // Check the environmental to see if there is device preference char *device_env = getenv("CL_DEVICE_TYPE"); if (device_env != NULL) { if( strcmp( device_env, "gpu" ) == 0 || strcmp( device_env, "CL_DEVICE_TYPE_GPU" ) == 0 ) device_type = CL_DEVICE_TYPE_GPU; else if( strcmp( device_env, "cpu" ) == 0 || strcmp( device_env, "CL_DEVICE_TYPE_CPU" ) == 0 ) device_type = CL_DEVICE_TYPE_CPU; else if( strcmp( device_env, "accelerator" ) == 0 || strcmp( device_env, "CL_DEVICE_TYPE_ACCELERATOR" ) == 0 ) device_type = CL_DEVICE_TYPE_ACCELERATOR; else if( strcmp( device_env, "default" ) == 0 || strcmp( device_env, "CL_DEVICE_TYPE_DEFAULT" ) == 0 ) device_type = CL_DEVICE_TYPE_DEFAULT; else { log_error( "Unknown CL_DEVICE_TYPE environment variable: %s.\nAborting...\n", device_env ); abort(); } } const char ** argList = (const char **)calloc( argc, sizeof( char*) ); if( NULL == argList ) { log_error( "Failed to allocate memory for argList array.\n" ); return 1; } argList[0] = argv[0]; size_t argCount = 1; for (i=1; i < argc; ++i) { const char *arg = argv[i]; if (arg == NULL) break; if (arg[0] == '-') { arg++; while(*arg != '\0') { switch(*arg) { case 'h': printUsage(); return 0; default: log_error( " <-- unknown flag: %c (0x%2.2x)\n)", *arg, *arg ); printUsage(); return 0; } arg++; } } else { if( 0 == strcmp( argv[i], "CL_DEVICE_TYPE_CPU" ) ) device_type = CL_DEVICE_TYPE_CPU; else if( 0 == strcmp( argv[i], "CL_DEVICE_TYPE_GPU" ) ) device_type = CL_DEVICE_TYPE_GPU; else if( 0 == strcmp( argv[i], "CL_DEVICE_TYPE_ACCELERATOR" ) ) device_type = CL_DEVICE_TYPE_ACCELERATOR; else if( 0 == strcmp( argv[i], "CL_DEVICE_TYPE_DEFAULT" ) ) device_type = CL_DEVICE_TYPE_DEFAULT; else { argList[argCount] = arg; argCount++; } } } int err; gFd = acquireOutputStream(); // Get platform err = clGetPlatformIDs(1, &platform_id, NULL); checkErr(err,"clGetPlatformIDs failed"); // Get Device information err = clGetDeviceIDs(platform_id, device_type, 1, &gDevice, 0); checkErr(err,"clGetComputeDevices"); err = clGetDeviceInfo(gDevice, CL_DEVICE_TYPE, sizeof(cl_device_type), &device_type, NULL); checkErr(err,"clGetComputeConfigInfo 1"); size_t config_size = sizeof( device_frequency ); #if MULTITHREAD if( (err = clGetDeviceInfo(gDevice, CL_DEVICE_MAX_COMPUTE_UNITS, config_size, &compute_devices, NULL )) ) #endif compute_devices = 1; config_size = sizeof(device_frequency); if((err = clGetDeviceInfo(gDevice, CL_DEVICE_MAX_CLOCK_FREQUENCY, config_size, &device_frequency, NULL ))) device_frequency = 1; releaseOutputStream(gFd); log_info( "\nCompute Device info:\n" ); log_info( "\tProcessing with %d devices\n", compute_devices ); log_info( "\tDevice Frequency: %d MHz\n", device_frequency ); printDeviceHeader( gDevice ); printArch(); err = check_opencl_version(gDevice,1,2); if( err != CL_SUCCESS ) { print_missing_feature(err,"printf"); test_finish(); return err; } log_info( "Test binary built %s %s\n", __DATE__, __TIME__ ); gFd = acquireOutputStream(); gContext = clCreateContext(NULL, 1, &gDevice, notify_callback, NULL, NULL); checkNull(gContext, "clCreateContext"); gQueue = clCreateCommandQueueWithProperties(gContext, gDevice, 0, NULL); checkNull(gQueue, "clCreateCommandQueue"); releaseOutputStream(gFd); err = parseAndCallCommandLineTests( argCount, argList, NULL, num_fns, basefn_list, basefn_names, true, 0, 0 ); if(gQueue) { int error = clFinish(gQueue); if (error) { log_error("clFinish failed: %d\n", error); } } if(clReleaseCommandQueue(gQueue)!=CL_SUCCESS) log_error("clReleaseCommandQueue\n"); if(clReleaseContext(gContext)!= CL_SUCCESS) log_error("clReleaseContext\n"); releaseOutputStream(gFd); free(argList); test_finish(); return err; } //----------------------------------------- // printUsage //----------------------------------------- static void printUsage( void ) { log_info("test_printf: \n"); log_info("\tdefault is to run the full test on the default device\n"); log_info("\n"); for( int i = 0; i < num_fns; i++ ) { log_info( "\t%s\n", basefn_names[i] ); } }