// // Copyright (c) 2017 The Khronos Group Inc. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // #include "../../test_common/harness/compat.h" #include #include #include #include #include #include "procs.h" #include "../../test_common/harness/errorHelpers.h" #define STRING_LENGTH 1024 void createKernelSourceCode(char *source, int num_pipes) { int i; char str[256]; int str_length; strcpy(source, "__kernel void test_multiple_pipe_write(__global int *src, "); for(i = 0; i < num_pipes; i++) { sprintf(str, "__write_only pipe int pipe%d, ", i); strcat(source, str); } sprintf(str, "int num_pipes ) \n{\n int gid = get_global_id(0);\n reserve_id_t res_id;\n\n"); strcat(source, str); sprintf(str, " if(gid < (get_global_size(0))/num_pipes)\n {\n res_id = reserve_write_pipe(pipe0, 1);\n if(is_valid_reserve_id(res_id))\n {\n"); strcat(source, str); sprintf(str, " write_pipe(pipe0, res_id, 0, &src[gid]);\n commit_write_pipe(pipe0, res_id);\n }\n }\n"); strcat(source, str); for(i = 1; i < num_pipes; i++){ sprintf(str, " else if(gid < (%d*get_global_size(0))/num_pipes)\n {\n res_id = reserve_write_pipe(pipe%d, 1);\n if(is_valid_reserve_id(res_id))\n {\n", i+1, i); strcat(source, str); sprintf(str, " write_pipe(pipe%d, res_id, 0, &src[gid]);\n commit_write_pipe(pipe%d, res_id);\n }\n }\n", i, i); strcat(source, str); } strcat(source, "}\n\n__kernel void test_multiple_pipe_read(__global int *dst, "); for(i = 0; i < num_pipes; i++) { sprintf(str, "__read_only pipe int pipe%d, ", i); strcat(source, str); } sprintf(str, "int num_pipes ) \n{\n int gid = get_global_id(0);\n reserve_id_t res_id;\n\n"); strcat(source, str); sprintf(str, " if(gid < (get_global_size(0))/num_pipes)\n {\n res_id = reserve_read_pipe(pipe0, 1);\n if(is_valid_reserve_id(res_id))\n {\n"); strcat(source, str); sprintf(str, " read_pipe(pipe0, res_id, 0, &dst[gid]);\n commit_read_pipe(pipe0, res_id);\n }\n }\n"); strcat(source, str); for(i = 1; i < num_pipes; i++){ sprintf(str, " else if(gid < (%d*get_global_size(0))/num_pipes)\n {\n res_id = reserve_read_pipe(pipe%d, 1);\n if(is_valid_reserve_id(res_id))\n {\n", i+1, i); strcat(source, str); sprintf(str, " read_pipe(pipe%d, res_id, 0, &dst[gid]);\n commit_read_pipe(pipe%d, res_id);\n }\n }\n", i, i); strcat(source, str); } strcat(source, "}"); str_length = strlen(source); assert(str_length <= STRING_LENGTH*num_pipes); } static int verify_result(void *ptr1, void *ptr2, int n) { int i; int sum_input = 0, sum_output = 0; cl_char *inptr = (cl_char *)ptr1; cl_char *outptr = (cl_char *)ptr2; for(i = 0; i < n; i++) { sum_input += inptr[i]; sum_output += outptr[i]; } if(sum_input != sum_output){ return -1; } return 0; } static int verify_result_int(void *ptr1, void *ptr2, int n) { int i; int sum_input = 0, sum_output = 0; cl_int *inptr = (cl_int *)ptr1; cl_int *outptr = (cl_int *)ptr2; for(i = 0; i < n; i++) { sum_input += inptr[i]; sum_output += outptr[i]; } if(sum_input != sum_output){ return -1; } return 0; } int test_pipe_max_args(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { cl_mem pipes[1024]; cl_mem buffers[2]; void *outptr; cl_int *inptr; cl_program program; cl_kernel kernel[2]; size_t global_work_size[3]; cl_int err; cl_int size; int num_pipe_elements = 1024; int i, j; int max_pipe_args; char *source; cl_event producer_sync_event = NULL; cl_event consumer_sync_event = NULL; MTdata d = init_genrand( gRandomSeed ); const char* kernelName[] = {"test_multiple_pipe_write", "test_multiple_pipe_read"}; size_t min_alignment = get_min_alignment(context); err = clGetDeviceInfo(deviceID, CL_DEVICE_MAX_PIPE_ARGS, sizeof(max_pipe_args), (void*)&max_pipe_args, NULL); if(err){ print_error(err, " clGetDeviceInfo failed\n"); return -1; } if(max_pipe_args < 16){ log_error("The device should support minimum 16 pipe objects that could be passed as arguments to the kernel"); return -1; } global_work_size[0] = (cl_uint)num_pipe_elements * max_pipe_args; size = sizeof(int) * num_pipe_elements * max_pipe_args; source = (char *)malloc(STRING_LENGTH * sizeof(char) * max_pipe_args); inptr = (cl_int *)align_malloc(size, min_alignment); for(i = 0; i < num_pipe_elements * max_pipe_args; i++){ inptr[i] = (int)genrand_int32(d); } buffers[0] = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, size, inptr, &err); if(err){ clReleaseMemObject(buffers[0]); free(source); print_error(err, " clCreateBuffer failed\n"); return -1; } outptr = align_malloc(size, min_alignment); buffers[1] = clCreateBuffer(context, CL_MEM_USE_HOST_PTR, size, outptr, &err); if ( err ){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free( outptr ); free(source); print_error(err, " clCreateBuffer failed\n" ); return -1; } for(i = 0; i < max_pipe_args; i++){ pipes[i] = clCreatePipe(context, CL_MEM_HOST_NO_ACCESS, sizeof(int), num_pipe_elements, NULL, &err); if(err){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free( outptr ); free(source); for(j = 0; j < i; j++) { clReleaseMemObject(pipes[j]); } print_error(err, " clCreatePipe failed\n"); return -1; } } createKernelSourceCode(source, max_pipe_args); // Create producer kernel err = create_single_kernel_helper_with_build_options(context, &program, &kernel[0], 1, (const char**)&source, kernelName[0], "-cl-std=CL2.0"); if(err){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } align_free(outptr); free(source); print_error(err, "Error creating program\n"); return -1; } //Create consumer kernel kernel[1] = clCreateKernel(program, kernelName[1], &err); if( kernel[1] == NULL || err != CL_SUCCESS) { clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } align_free(outptr); free(source); print_error(err, " Error creating kernel\n"); return -1; } err = clSetKernelArg(kernel[0], 0, sizeof(cl_mem), (void*)&buffers[0]); for( i = 0; i < max_pipe_args; i++){ err |= clSetKernelArg(kernel[0], i+1, sizeof(cl_mem), (void*)&pipes[i]); } err |= clSetKernelArg(kernel[0], max_pipe_args + 1, sizeof(int), (void*)&max_pipe_args); err |= clSetKernelArg(kernel[1], 0, sizeof(cl_mem), (void*)&buffers[1]); for( i = 0; i < max_pipe_args; i++){ err |= clSetKernelArg(kernel[1], i+1, sizeof(cl_mem), (void*)&pipes[i]); } err |= clSetKernelArg(kernel[1], max_pipe_args + 1, sizeof(int), (void*)&max_pipe_args); if ( err != CL_SUCCESS ){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseProgram(program); align_free(outptr); free(source); print_error(err, " clSetKernelArg failed"); return -1; } // Launch Producer kernel err = clEnqueueNDRangeKernel( queue, kernel[0], 1, NULL, global_work_size, NULL, 0, NULL, &producer_sync_event ); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } // Launch Consumer kernel err = clEnqueueNDRangeKernel( queue, kernel[1], 1, NULL, global_work_size, NULL, 1, &producer_sync_event, &consumer_sync_event ); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } err = clEnqueueReadBuffer(queue, buffers[1], true, 0, size, outptr, 1, &consumer_sync_event, NULL); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueReadBuffer failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } err = clWaitForEvents(1, &consumer_sync_event); if ( err != CL_SUCCESS ){ print_error( err, " clWaitForEvents failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } if( verify_result( inptr, outptr, num_pipe_elements*sizeof(cl_int))){ log_error("test_pipe_max_args failed\n"); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } else { log_info("test_pipe_max_args passed\n"); } //cleanup clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); for(j = 0; j < max_pipe_args; j++) { clReleaseMemObject(pipes[j]); } clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return 0; } int test_pipe_max_packet_size(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { cl_mem pipe; cl_mem buffers[2]; void *outptr; cl_char *inptr; cl_program program; cl_kernel kernel[2]; size_t global_work_size[3]; cl_int err; size_t size; int num_pipe_elements = 1024; int i; cl_uint max_pipe_packet_size; char *source; char str[256]; int str_length; cl_event producer_sync_event = NULL; cl_event consumer_sync_event = NULL; MTdata d = init_genrand( gRandomSeed ); const char* kernelName[] = {"test_pipe_max_packet_size_write", "test_pipe_max_packet_size_read"}; size_t min_alignment = get_min_alignment(context); global_work_size[0] = (cl_uint)num_pipe_elements; source = (char*)malloc(STRING_LENGTH*sizeof(char)); err = clGetDeviceInfo(deviceID, CL_DEVICE_PIPE_MAX_PACKET_SIZE, sizeof(max_pipe_packet_size), (void*)&max_pipe_packet_size, NULL); if(err){ print_error(err, " clGetDeviceInfo failed\n"); return -1; } if(max_pipe_packet_size < 1024){ log_error("The device should support minimum packet size of 1024 bytes"); return -1; } if(max_pipe_packet_size > (32*1024*1024/num_pipe_elements)) { max_pipe_packet_size = 32*1024*1024/num_pipe_elements; } size = max_pipe_packet_size * num_pipe_elements; inptr = (cl_char *)align_malloc(size, min_alignment); for(i = 0; i < size; i++){ inptr[i] = (char)genrand_int32(d); } buffers[0] = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, size, inptr, &err); if(err){ clReleaseMemObject(buffers[0]); free(source); print_error(err, " clCreateBuffer failed\n"); return -1; } outptr = align_malloc(size, min_alignment); buffers[1] = clCreateBuffer(context, CL_MEM_USE_HOST_PTR, size, outptr, &err); if ( err ){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free( outptr ); free(source); print_error(err, " clCreateBuffer failed\n" ); return -1; } pipe = clCreatePipe(context, CL_MEM_HOST_NO_ACCESS, max_pipe_packet_size, num_pipe_elements, NULL, &err); if(err){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free( outptr ); free(source); clReleaseMemObject(pipe); print_error(err, " clCreatePipe failed\n"); return -1; } sprintf(str, "typedef struct{\n char a[%d];\n}TestStruct;\n\n__kernel void test_pipe_max_packet_size_write(__global TestStruct *src, __write_only pipe TestStruct out_pipe)\n{\n", max_pipe_packet_size); strcpy(source,str); strcat(source, " int gid = get_global_id(0);\n reserve_id_t res_id;\n\n"); sprintf(str, " res_id = reserve_write_pipe(out_pipe, 1);\n if(is_valid_reserve_id(res_id))\n {\n"); strcat(source, str); sprintf(str, " write_pipe(out_pipe, res_id, 0, &src[gid]);\n commit_write_pipe(out_pipe, res_id);\n }\n}\n\n"); strcat(source, str); sprintf(str, "__kernel void test_pipe_max_packet_size_read(__read_only pipe TestStruct in_pipe, __global TestStruct *dst)\n{\n"); strcat(source, str); strcat(source, " int gid = get_global_id(0);\n reserve_id_t res_id;\n\n"); sprintf(str, " res_id = reserve_read_pipe(in_pipe, 1);\n if(is_valid_reserve_id(res_id))\n {\n"); strcat(source, str); sprintf(str, " read_pipe(in_pipe, res_id, 0, &dst[gid]);\n commit_read_pipe(in_pipe, res_id);\n }\n}\n\n"); strcat(source, str); str_length = strlen(source); assert(str_length <= STRING_LENGTH); // Create producer kernel err = create_single_kernel_helper_with_build_options(context, &program, &kernel[0], 1, (const char**)&source, kernelName[0], "-cl-std=CL2.0"); if(err){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); align_free(outptr); free(source); print_error(err, "Error creating program\n"); return -1; } //Create consumer kernel kernel[1] = clCreateKernel(program, kernelName[1], &err); if( kernel[1] == NULL || err != CL_SUCCESS) { clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); align_free(outptr); free(source); print_error(err, "Error creating kernel\n"); return -1; } err = clSetKernelArg(kernel[0], 0, sizeof(cl_mem), (void*)&buffers[0]); err |= clSetKernelArg(kernel[0], 1, sizeof(cl_mem), (void*)&pipe); err |= clSetKernelArg(kernel[1], 0, sizeof(cl_mem), (void*)&pipe); err |= clSetKernelArg(kernel[1], 1, sizeof(cl_mem), (void*)&buffers[1]); if ( err != CL_SUCCESS ){ clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseProgram(program); align_free(outptr); free(source); print_error(err, " clSetKernelArg failed"); return -1; } // Launch Producer kernel err = clEnqueueNDRangeKernel( queue, kernel[0], 1, NULL, global_work_size, NULL, 0, NULL, &producer_sync_event ); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } // Launch Consumer kernel err = clEnqueueNDRangeKernel( queue, kernel[1], 1, NULL, global_work_size, NULL, 1, &producer_sync_event, &consumer_sync_event ); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } err = clEnqueueReadBuffer(queue, buffers[1], true, 0, size, outptr, 1, &consumer_sync_event, NULL); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueReadBuffer failed" ); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } if( verify_result( inptr, outptr, size)){ log_error("test_pipe_max_packet_size failed\n"); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return -1; } else { log_info("test_pipe_max_packet_size passed\n"); } //cleanup clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseMemObject(pipe); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(producer_sync_event); clReleaseEvent(consumer_sync_event); clReleaseProgram(program); align_free(outptr); free(source); return 0; } int test_pipe_max_active_reservations(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements) { cl_mem pipe; cl_mem buffers[2]; cl_mem buf_reservations; cl_mem buf_status; cl_mem buf_reserve_id_t_size; cl_mem buf_reserve_id_t_size_aligned; cl_int *inptr; void *outptr; int size, i; cl_program program; cl_kernel kernel[3]; size_t global_work_size[3]; cl_int err; int status = 0; cl_uint max_active_reservations = 0; cl_ulong max_global_size = 0; int reserve_id_t_size; int temp; char *source; char str[256]; int str_length; cl_event sync_event = NULL; cl_event read_event = NULL; MTdata d = init_genrand( gRandomSeed ); const char* kernelName[3] = {"test_pipe_max_active_reservations_write", "test_pipe_max_active_reservations_read", "pipe_get_reserve_id_t_size"}; size_t min_alignment = get_min_alignment(context); source = (char*)malloc(2*STRING_LENGTH*sizeof(char)); global_work_size[0] = 1; err = clGetDeviceInfo(deviceID, CL_DEVICE_PIPE_MAX_ACTIVE_RESERVATIONS, sizeof(max_active_reservations), (void*)&max_active_reservations, NULL); if(err){ print_error(err, " clGetDeviceInfo failed\n"); return -1; } err = clGetDeviceInfo(deviceID, CL_DEVICE_GLOBAL_MEM_SIZE, sizeof(max_global_size), (void*)&max_global_size, NULL); if(err){ print_error(err, " clGetDeviceInfo failed\n"); return -1; } max_active_reservations = (max_active_reservations > max_global_size) ? 1<<16 : max_active_reservations; if(max_active_reservations < 1){ log_error("The device should support minimum active reservations of 1"); return -1; } // To get reserve_id_t size buf_reserve_id_t_size = clCreateBuffer(context, CL_MEM_HOST_READ_ONLY, sizeof(reserve_id_t_size), NULL, &err); if ( err ){ clReleaseMemObject(buf_reserve_id_t_size); print_error(err, " clCreateBuffer failed\n" ); return -1; } sprintf(str, "__kernel void test_pipe_max_active_reservations_write(__global int *src, __write_only pipe int out_pipe, __global char *reserve_id, __global int *reserve_id_t_size_aligned, __global int *status)\n{\n"); strcpy(source,str); sprintf(str, " __global reserve_id_t *res_id_ptr;\n int reserve_idx;\n int commit_idx;\n"); strcat(source, str); sprintf(str, " for(reserve_idx = 0; reserve_idx < %d; reserve_idx++)\n {\n", max_active_reservations); strcat(source, str); sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + reserve_idx*reserve_id_t_size_aligned[0]);\n"); strcat(source, str); sprintf(str, " *res_id_ptr = reserve_write_pipe(out_pipe, 1);\n"); strcat(source, str); sprintf(str, " if(is_valid_reserve_id(res_id_ptr[0]))\n {\n write_pipe(out_pipe, res_id_ptr[0], 0, &src[reserve_idx]);\n }\n"); strcat(source, str); sprintf(str, " else\n {\n *status = -1;\n return;\n }\n }\n"); strcat(source, str); sprintf(str, " for(commit_idx = 0; commit_idx < %d; commit_idx++)\n {\n", max_active_reservations); strcat(source, str); sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + commit_idx*reserve_id_t_size_aligned[0]);\n"); strcat(source, str); sprintf(str, " commit_write_pipe(out_pipe, res_id_ptr[0]);\n }\n}\n\n"); strcat(source, str); sprintf(str, "__kernel void test_pipe_max_active_reservations_read(__read_only pipe int in_pipe, __global int *dst, __global char *reserve_id, __global int *reserve_id_t_size_aligned, __global int *status)\n{\n"); strcat(source, str); sprintf(str, " __global reserve_id_t *res_id_ptr;\n int reserve_idx;\n int commit_idx;\n"); strcat(source, str); sprintf(str, " for(reserve_idx = 0; reserve_idx < %d; reserve_idx++)\n {\n", max_active_reservations); strcat(source, str); sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + reserve_idx*reserve_id_t_size_aligned[0]);\n"); strcat(source, str); sprintf(str, " *res_id_ptr = reserve_read_pipe(in_pipe, 1);\n"); strcat(source, str); sprintf(str, " if(is_valid_reserve_id(res_id_ptr[0]))\n {\n read_pipe(in_pipe, res_id_ptr[0], 0, &dst[reserve_idx]);\n }\n"); strcat(source, str); sprintf(str, " else\n {\n *status = -1;\n return;\n }\n }\n"); strcat(source, str); sprintf(str, " for(commit_idx = 0; commit_idx < %d; commit_idx++)\n {\n", max_active_reservations); strcat(source, str); sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + commit_idx*reserve_id_t_size_aligned[0]);\n"); strcat(source, str); sprintf(str, " commit_read_pipe(in_pipe, res_id_ptr[0]);\n }\n}\n\n"); strcat(source, str); sprintf(str, "__kernel void pipe_get_reserve_id_t_size(__global int *reserve_id_t_size) \n"); strcat(source, str); sprintf(str, "{\n *reserve_id_t_size = sizeof(reserve_id_t);\n}\n"); strcat(source, str); str_length = strlen(source); assert(str_length <= 2*STRING_LENGTH); // Create producer kernel err = create_single_kernel_helper_with_build_options(context, &program, &kernel[0], 1, (const char**)&source, kernelName[0], "-cl-std=CL2.0"); if(err){ clReleaseMemObject(buf_reserve_id_t_size); print_error(err, "Error creating program\n"); return -1; } // Create consumer kernel kernel[1] = clCreateKernel(program, kernelName[1], &err); if( kernel[1] == NULL || err != CL_SUCCESS) { clReleaseMemObject(buf_reserve_id_t_size); print_error(err, "Error creating kernel\n"); return -1; } // Create size query kernel for reserve_id_t kernel[2] = clCreateKernel(program, kernelName[2], &err); if( kernel[2] == NULL || err != CL_SUCCESS) { clReleaseMemObject(buf_reserve_id_t_size); print_error(err, "Error creating kernel\n"); return -1; } err = clSetKernelArg(kernel[2], 0, sizeof(cl_mem), (void*)&buf_reserve_id_t_size); if(err){ clReleaseMemObject(buf_reserve_id_t_size); print_error(err, "Error creating program\n"); return -1; } //Launch size query kernel for reserve_id_t err = clEnqueueNDRangeKernel( queue, kernel[2], 1, NULL, global_work_size, NULL, 0, NULL, &sync_event ); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buf_reserve_id_t_size); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } err = clEnqueueReadBuffer(queue, buf_reserve_id_t_size, true, 0, sizeof(reserve_id_t_size), &reserve_id_t_size, 1, &sync_event, &read_event); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueReadBuffer failed" ); clReleaseMemObject(buf_reserve_id_t_size); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } err = clWaitForEvents(1, &read_event); if ( err != CL_SUCCESS ){ print_error( err, " clWaitForEvents failed" ); clReleaseMemObject(buf_reserve_id_t_size); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); return -1; } // Round reserve_id_t_size to the nearest power of 2 temp = 1; while(temp < reserve_id_t_size) temp *= 2; reserve_id_t_size = temp; size = sizeof(cl_int) * max_active_reservations; inptr = (cl_int *)align_malloc(size, min_alignment); for(i = 0; i < max_active_reservations; i++){ inptr[i] = (int)genrand_int32(d); } buffers[0] = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, size, inptr, &err); if ( err ){ clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buffers[0]); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); print_error(err, " clCreateBuffer failed\n" ); return -1; } outptr = align_malloc(size, min_alignment); buffers[1] = clCreateBuffer(context, CL_MEM_HOST_READ_ONLY, size, NULL, &err); if ( err ){ clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); align_free(outptr); print_error(err, " clCreateBuffer failed\n" ); return -1; } buf_reserve_id_t_size_aligned = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, sizeof(reserve_id_t_size), &reserve_id_t_size, &err); if ( err ){ clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); print_error(err, " clCreateBuffer failed\n" ); return -1; } //For error status buf_status = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, sizeof(int), &status, &err); if ( err ){ clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); print_error(err, " clCreateBuffer failed\n" ); return -1; } pipe = clCreatePipe(context, CL_MEM_HOST_NO_ACCESS, sizeof(int), max_active_reservations, NULL, &err); if(err){ clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); print_error(err, " clCreatePipe failed\n"); return -1; } // Global buffer to hold all active reservation ids buf_reservations = clCreateBuffer(context, CL_MEM_HOST_NO_ACCESS, reserve_id_t_size*max_active_reservations, NULL, &err); if ( err != CL_SUCCESS ){ print_error( err, " clCreateBuffer failed" ); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseEvent(read_event); clReleaseProgram(program); return -1; } err = clSetKernelArg(kernel[0], 0, sizeof(cl_mem), (void*)&buffers[0]); err |= clSetKernelArg(kernel[0], 1, sizeof(cl_mem), (void*)&pipe); err |= clSetKernelArg(kernel[0], 2, sizeof(cl_mem), (void*)&buf_reservations); err |= clSetKernelArg(kernel[0], 3, sizeof(cl_mem), (void*)&buf_reserve_id_t_size_aligned); err |= clSetKernelArg(kernel[0], 4, sizeof(cl_mem), (void*)&buf_status); if ( err != CL_SUCCESS ){ clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseProgram(program); print_error(err, " clSetKernelArg failed"); return -1; } err = clSetKernelArg(kernel[1], 0, sizeof(cl_mem), (void*)&pipe); err |= clSetKernelArg(kernel[1], 1, sizeof(cl_mem), (void*)&buffers[1]); err |= clSetKernelArg(kernel[1], 2, sizeof(cl_mem), (void*)&buf_reservations); err |= clSetKernelArg(kernel[1], 3, sizeof(cl_mem), (void*)&buf_reserve_id_t_size_aligned); err |= clSetKernelArg(kernel[1], 4, sizeof(cl_mem), (void*)&buf_status); if ( err != CL_SUCCESS ){ clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseProgram(program); print_error(err, " clSetKernelArg failed"); return -1; } // Launch Producer kernel err = clEnqueueNDRangeKernel(queue, kernel[0], 1, NULL, global_work_size, NULL, 0, NULL, &sync_event); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } err = clEnqueueReadBuffer(queue, buf_status, true, 0, sizeof(int), &status, 1, &sync_event, NULL); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueReadBuffer failed" ); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } if(status != 0) { log_error("test_pipe_max_active_reservations failed\n"); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } // Launch Consumer kernel err = clEnqueueNDRangeKernel(queue, kernel[1], 1, NULL, global_work_size, NULL, 0, NULL, &sync_event); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueNDRangeKernel failed" ); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } err = clEnqueueReadBuffer(queue, buf_status, true, 0, sizeof(int), &status, 1, &sync_event, NULL); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueReadBuffer failed" ); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } if(status != 0) { log_error("test_pipe_max_active_reservations failed\n"); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } err = clEnqueueReadBuffer(queue, buffers[1], true, 0, size, outptr, 1, &sync_event, NULL); if ( err != CL_SUCCESS ){ print_error( err, " clEnqueueReadBuffer failed" ); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } if( verify_result_int( inptr, outptr, max_active_reservations)){ log_error("test_pipe_max_active_reservations failed\n"); clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseKernel(kernel[2]); clReleaseEvent(sync_event); clReleaseProgram(program); return -1; } else { log_info("test_pipe_max_active_reservations passed\n"); } //cleanup clReleaseMemObject(buf_status); clReleaseMemObject(buf_reserve_id_t_size); clReleaseMemObject(buf_reserve_id_t_size_aligned); clReleaseMemObject(buf_reservations); clReleaseMemObject(pipe); clReleaseMemObject(buffers[0]); clReleaseMemObject(buffers[1]); align_free(outptr); clReleaseKernel(kernel[0]); clReleaseKernel(kernel[1]); clReleaseEvent(sync_event); clReleaseProgram(program); return 0; }