// Mirror of https://github.com/KhronosGroup/OpenCL-CTS.git
// (synced 2026-03-19 14:09:03 +00:00; 219 lines, 7.5 KiB, C++)
//
|
|
// Copyright (c) 2017 The Khronos Group Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
#ifndef TEST_CONFORMANCE_CLCPP_WG_TEST_WG_ANY_HPP
|
|
#define TEST_CONFORMANCE_CLCPP_WG_TEST_WG_ANY_HPP
|
|
|
|
#include <vector>
|
|
#include <limits>
|
|
#include <algorithm>
|
|
|
|
// Common for all OpenCL C++ tests
|
|
#include "../common.hpp"
|
|
// Common for tests of work-group functions
|
|
#include "common.hpp"
|
|
|
|
// -----------------------------------------------------------------------------------
|
|
// ------------- ONLY FOR OPENCL 22 CONFORMANCE TEST 22 DEVELOPMENT ------------------
|
|
// -----------------------------------------------------------------------------------
|
|
#if defined(DEVELOPMENT) && defined(USE_OPENCLC_KERNELS)
|
|
// Returns the OpenCL C source of the test_wg_any kernel (the variant selected
// when both DEVELOPMENT and USE_OPENCLC_KERNELS are defined).
//
// In the generated kernel every work-item evaluates
// input[tid] == input[tid+1], passes that predicate to work_group_any() and
// stores 1 to output[tid] when the result is non-zero, 0 otherwise.
std::string generate_wg_any_kernel_code()
{
    std::string source;

    // Kernel signature and prologue
    source += "__kernel void test_wg_any(global uint *input, global uint *output)\n";
    source += "{\n";
    source += " ulong tid = get_global_id(0);\n";
    source += "\n";

    // Work-group predicate and result store
    source += " int result = work_group_any(input[tid] == input[tid+1]);\n";
    source += " if(result == 0) {\n output[tid] = 0;\n return;\n }\n";
    source += " output[tid] = 1;\n";
    source += "}\n";

    return source;
}
|
|
#else
|
|
// Returns the OpenCL C++ source of the test_wg_any kernel (the default
// variant, used when the OpenCL C development path is not selected).
//
// In the generated kernel every work-item evaluates
// input[tid] == input[tid+1], passes that predicate to work_group_any() and
// stores 1 to output[tid] when the result is true, 0 otherwise.
std::string generate_wg_any_kernel_code()
{
    // Source fragments, concatenated in order to form the kernel program.
    static const char *const fragments[] = {
        "#include <opencl_memory>\n",
        "#include <opencl_work_item>\n",
        "#include <opencl_work_group>\n",
        "using namespace cl;\n",
        "__kernel void test_wg_any(global_ptr<uint[]> input, global_ptr<uint[]> output)\n",
        "{\n",
        " ulong tid = get_global_id(0);\n",
        " bool result = work_group_any(input[tid] == input[tid+1]);\n",
        " if(!result) {\n output[tid] = 0;\n return;\n }\n",
        " output[tid] = 1;\n",
        "}\n"
    };

    std::string source;
    for (const char *fragment : fragments)
    {
        source += fragment;
    }
    return source;
}
|
|
#endif
|
|
|
|
int verify_wg_any(const std::vector<cl_uint> &in, const std::vector<cl_uint> &out, size_t count, size_t wg_size)
|
|
{
|
|
size_t i, j;
|
|
for (i = 0; i < count; i += wg_size)
|
|
{
|
|
// Work-group any
|
|
bool any = false;
|
|
for (j = 0; j < ((count - i) > wg_size ? wg_size : (count - i)); j++)
|
|
{
|
|
if(in[i+j] == in[i+j+1])
|
|
{
|
|
any = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
// Convert bool to uint
|
|
cl_uint any_uint = any ? 1 : 0;
|
|
// Check if all work-items in work-group stored correct value
|
|
for (j = 0; j < ((count - i) > wg_size ? wg_size : (count - i)); j++)
|
|
{
|
|
if (any_uint != out[i + j])
|
|
{
|
|
log_info(
|
|
"work_group_any %s: Error at %lu: expected = %lu, got = %lu\n",
|
|
type_name<cl_uint>().c_str(),
|
|
i + j,
|
|
static_cast<size_t>(any_uint),
|
|
static_cast<size_t>(out[i + j]));
|
|
return -1;
|
|
}
|
|
}
|
|
}
|
|
return CL_SUCCESS;
|
|
}
|
|
|
|
std::vector<cl_uint> generate_input_wg_any(size_t count, size_t wg_size)
|
|
{
|
|
std::vector<cl_uint> input(count, cl_uint(0));
|
|
size_t j = wg_size;
|
|
for(size_t i = 0; i < count; i++)
|
|
{
|
|
input[i] = static_cast<cl_uint>(i);
|
|
// In one place in ~half of workgroups input[tid] == input[tid+1] will
|
|
// generate true, that means for that workgroups work_group_any()
|
|
// should return true
|
|
if((j == wg_size/2) && (i > count/2))
|
|
{
|
|
input[i] = input[i - 1];
|
|
}
|
|
j--;
|
|
if(j == 0)
|
|
{
|
|
j = wg_size;
|
|
}
|
|
}
|
|
return input;
|
|
}
|
|
|
|
std::vector<cl_uint> generate_output_wg_any(size_t count, size_t wg_size)
|
|
{
|
|
(void) wg_size;
|
|
return std::vector<cl_uint>(count, cl_uint(1));
|
|
}
|
|
|
|
// Builds the test_wg_any kernel, runs it over `count` elements rounded up to a
// whole number of work-groups, and validates the result with verify_wg_any().
//
// Parameters:
//   device  - device queried for the kernel's work-group size.
//   context - context used to build the program and create the buffers.
//   queue   - command queue used for the buffer transfers and kernel launch.
//   count   - requested number of elements; the launch size is rounded up to
//             a multiple of the work-group size.
//
// Returns the last OpenCL status (CL_SUCCESS on a passing run), or an error
// value when a step or the verification fails. In the
// DEVELOPMENT + ONLY_SPIRV_COMPILATION configuration the function returns
// right after kernel creation.
int work_group_any(cl_device_id device, cl_context context, cl_command_queue queue, size_t count)
{
    cl_mem buffers[2];
    cl_program program;
    cl_kernel kernel;
    size_t wg_size;
    size_t work_size[1];
    int err;

    std::string code_str = generate_wg_any_kernel_code();
// -----------------------------------------------------------------------------------
// ------------- ONLY FOR OPENCL 22 CONFORMANCE TEST 22 DEVELOPMENT ------------------
// -----------------------------------------------------------------------------------
// Only OpenCL C++ to SPIR-V compilation
#if defined(DEVELOPMENT) && defined(ONLY_SPIRV_COMPILATION)
    err = create_opencl_kernel(context, &program, &kernel, code_str, "test_wg_any");
    RETURN_ON_ERROR(err)
    return err;
// Use OpenCL C kernels instead of OpenCL C++ kernels (test C++ host code)
#elif defined(DEVELOPMENT) && defined(USE_OPENCLC_KERNELS)
    err = create_opencl_kernel(context, &program, &kernel, code_str, "test_wg_any", "-cl-std=CL2.0", false);
    RETURN_ON_ERROR(err)
#else
    err = create_opencl_kernel(context, &program, &kernel, code_str, "test_wg_any");
    RETURN_ON_ERROR(err)
#endif

    // NOTE(review): the RETURN_ON_* macros below presumably return early
    // without releasing the objects created so far - confirm and consider
    // scoped wrappers for the OpenCL handles.
    err = clGetKernelWorkGroupInfo(kernel, device, CL_KERNEL_WORK_GROUP_SIZE, sizeof(size_t), &wg_size, NULL);
    RETURN_ON_CL_ERROR(err, "clGetKernelWorkGroupInfo")

    // Calculate global work size: round count up to a whole number of
    // work-groups using exact integer arithmetic (no floating-point round trip).
    const size_t wg_number = (count / wg_size) + ((count % wg_size) != 0 ? 1 : 0);
    const size_t flat_work_size = wg_number * wg_size;
    work_size[0] = flat_work_size;

    // The kernel reads input[tid + 1], so the input holds one extra element.
    std::vector<cl_uint> input = generate_input_wg_any(flat_work_size + 1, wg_size);
    std::vector<cl_uint> output = generate_output_wg_any(flat_work_size, wg_size);

    buffers[0] = clCreateBuffer(context, static_cast<cl_mem_flags>(CL_MEM_READ_WRITE), sizeof(cl_uint) * input.size(), NULL, &err);
    RETURN_ON_CL_ERROR(err, "clCreateBuffer");

    buffers[1] = clCreateBuffer(context, static_cast<cl_mem_flags>(CL_MEM_READ_WRITE), sizeof(cl_uint) * output.size(), NULL, &err);
    RETURN_ON_CL_ERROR(err, "clCreateBuffer");

    // Blocking write: the host vector is fully copied before the call returns.
    err = clEnqueueWriteBuffer(
        queue, buffers[0], CL_TRUE, 0, sizeof(cl_uint) * input.size(),
        static_cast<void *>(input.data()), 0, NULL, NULL
    );
    RETURN_ON_CL_ERROR(err, "clEnqueueWriteBuffer");

    err = clSetKernelArg(kernel, 0, sizeof(buffers[0]), &buffers[0]);
    err |= clSetKernelArg(kernel, 1, sizeof(buffers[1]), &buffers[1]);
    RETURN_ON_CL_ERROR(err, "clSetKernelArg");

    err = clEnqueueNDRangeKernel(queue, kernel, 1, NULL, work_size, &wg_size, 0, NULL, NULL);
    RETURN_ON_CL_ERROR(err, "clEnqueueNDRangeKernel");

    // Blocking read: results are available in `output` once the call returns.
    err = clEnqueueReadBuffer(
        queue, buffers[1], CL_TRUE, 0, sizeof(cl_uint) * output.size(),
        static_cast<void *>(output.data()), 0, NULL, NULL
    );
    RETURN_ON_CL_ERROR(err, "clEnqueueReadBuffer");

    const int verify_status = verify_wg_any(input, output, flat_work_size, wg_size);

    // Release the OpenCL objects before reporting, so that a verification
    // failure does not leak them.
    clReleaseMemObject(buffers[0]);
    clReleaseMemObject(buffers[1]);
    clReleaseKernel(kernel);
    clReleaseProgram(program);

    if (verify_status != CL_SUCCESS)
    {
        RETURN_ON_ERROR_MSG(-1, "work_group_any failed");
    }
    log_info("work_group_any passed\n");

    return err;
}
|
|
|
|
// Test case declared through AUTO_TEST_CASE: runs work_group_any() with
// n_elems elements and maps its status to CL_SUCCESS (pass) or -1 (any error).
AUTO_TEST_CASE(test_work_group_any)
(cl_device_id device, cl_context context, cl_command_queue queue, int n_elems)
{
    int err = work_group_any(device, context, queue, n_elems);
    CHECK_ERROR(err)

    return (err == CL_SUCCESS) ? CL_SUCCESS : -1;
}
|
|
|
|
#endif // TEST_CONFORMANCE_CLCPP_WG_TEST_WG_ANY_HPP
|