mirror of
https://github.com/KhronosGroup/OpenCL-CTS.git
synced 2026-03-19 06:09:01 +00:00
734 lines
20 KiB
C++
734 lines
20 KiB
C++
//
|
|
// Copyright (c) 2017 The Khronos Group Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
#ifndef TEST_CONFORMANCE_CLCPP_MATH_FUNCS_FP_FUNCS_HPP
|
|
#define TEST_CONFORMANCE_CLCPP_MATH_FUNCS_FP_FUNCS_HPP
|
|
|
|
#include <type_traits>
|
|
#include <cmath>
|
|
|
|
#include "common.hpp"
|
|
|
|
// -------------- UNARY FUNCTIONS
|
|
|
|
// gentype ceil(gentype x);
|
|
// gentype floor(gentype x);
|
|
// gentype rint(gentype x);
|
|
// gentype round(gentype x);
|
|
// gentype trunc(gentype x);
|
|
// group_name, func_name, reference_func, use_ulp, ulp, ulp_for_embedded, max_delta, min1, max1
|
|
MATH_FUNCS_DEFINE_UNARY_FUNC(fp, ceil, std::ceil, true, 0.0f, 0.0f, 0.001f, -1000.0f, 1000.0f)
|
|
MATH_FUNCS_DEFINE_UNARY_FUNC(fp, floor, std::floor, true, 0.0f, 0.0f, 0.001f, -1000.0f, 1000.0f)
|
|
MATH_FUNCS_DEFINE_UNARY_FUNC(fp, rint, std::rint, true, 0.0f, 0.0f, 0.001f, -1000.0f, 1000.0f)
|
|
MATH_FUNCS_DEFINE_UNARY_FUNC(fp, round, std::round, true, 0.0f, 0.0f, 0.001f, -1000.0f, 1000.0f)
|
|
MATH_FUNCS_DEFINE_UNARY_FUNC(fp, trunc, std::trunc, true, 0.0f, 0.0f, 0.001f, -1000.0f, 1000.0f)
|
|
|
|
// floatn nan(uintn nancode);
|
|
struct fp_func_nan : public unary_func<cl_uint, cl_float>
|
|
{
|
|
std::string str()
|
|
{
|
|
return "nan";
|
|
}
|
|
|
|
std::string headers()
|
|
{
|
|
return "#include <opencl_math>\n";
|
|
}
|
|
|
|
cl_float operator()(const cl_uint& x)
|
|
{
|
|
cl_uint r = x | 0x7fc00000U;
|
|
// cl_float and cl_int have the same size so that's correct
|
|
cl_float rf = *reinterpret_cast<cl_float*>(&r);
|
|
return rf;
|
|
}
|
|
|
|
cl_uint min1()
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
cl_uint max1()
|
|
{
|
|
return 100;
|
|
}
|
|
|
|
std::vector<cl_uint> in1_special_cases()
|
|
{
|
|
return {
|
|
0, 1
|
|
};
|
|
}
|
|
};
|
|
|
|
// -------------- UNARY FUNCTIONS, 2ND ARG IS POINTER
|
|
|
|
// gentype fract(gentype x, gentype* iptr);
|
|
//
|
|
// Fuction fract() returns additional value via pointer (2nd argument). In order to test
|
|
// if it's correct output buffer type is cl_float2. In first compontent we store what
|
|
// fract() function returns, and in the 2nd component we store what is returned via its
|
|
// 2nd argument (gentype* iptr).
|
|
struct fp_func_fract : public unary_func<cl_float, cl_float2>
|
|
{
|
|
fp_func_fract(bool is_embedded) : m_is_embedded(is_embedded)
|
|
{
|
|
|
|
}
|
|
|
|
std::string str()
|
|
{
|
|
return "fract";
|
|
}
|
|
|
|
std::string headers()
|
|
{
|
|
return "#include <opencl_math>\n";
|
|
}
|
|
|
|
cl_double2 operator()(const cl_float& x)
|
|
{
|
|
return reference::fract(static_cast<cl_double>(x));
|
|
}
|
|
|
|
cl_float min1()
|
|
{
|
|
return -1000.0f;
|
|
}
|
|
|
|
cl_float max1()
|
|
{
|
|
return 1000.0f;
|
|
}
|
|
|
|
std::vector<cl_float> in1_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
cl_float(2.0f),
|
|
cl_float(-2.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
bool use_ulp()
|
|
{
|
|
return true;
|
|
}
|
|
|
|
float ulp()
|
|
{
|
|
if(m_is_embedded)
|
|
{
|
|
return 0.0f;
|
|
}
|
|
return 0.0f;
|
|
}
|
|
private:
|
|
bool m_is_embedded;
|
|
};
|
|
|
|
// We need to specialize generate_kernel_unary<>() function template for fp_func_fract.
|
|
// -----------------------------------------------------------------------------------
|
|
// ------------- ONLY FOR OPENCL 22 CONFORMANCE TEST 22 DEVELOPMENT ------------------
|
|
// -----------------------------------------------------------------------------------
|
|
#if defined(DEVELOPMENT) && defined(USE_OPENCLC_KERNELS)
|
|
template <>
|
|
std::string generate_kernel_unary<fp_func_fract, cl_float, cl_float2>(fp_func_fract func)
|
|
{
|
|
return
|
|
"__kernel void test_fract(global float *input, global float2 *output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" float itpr = 0;\n"
|
|
" result.x = fract(input[gid], &itpr);\n"
|
|
" result.y = itpr;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#else
|
|
template <>
|
|
std::string generate_kernel_unary<fp_func_fract, cl_float, cl_float2>(fp_func_fract func)
|
|
{
|
|
return
|
|
"" + func.defs() +
|
|
"" + func.headers() +
|
|
"#include <opencl_memory>\n"
|
|
"#include <opencl_work_item>\n"
|
|
"using namespace cl;\n"
|
|
"__kernel void test_fract(global_ptr<float[]> input, global_ptr<float2[]> output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" float itpr = 0;\n"
|
|
" result.x = fract(input[gid], &itpr);\n"
|
|
" result.y = itpr;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#endif
|
|
|
|
// gentype modf(gentype x, gentype* iptr);
|
|
//
|
|
// Fuction modf() returns additional value via pointer (2nd argument). In order to test
|
|
// if it's correct output buffer type is cl_float2. In first compontent we store what
|
|
// modf() function returns, and in the 2nd component we store what is returned via its
|
|
// 2nd argument (gentype* iptr).
|
|
struct fp_func_modf : public unary_func<cl_float, cl_float2>
|
|
{
|
|
fp_func_modf(bool is_embedded) : m_is_embedded(is_embedded)
|
|
{
|
|
|
|
}
|
|
|
|
std::string str()
|
|
{
|
|
return "modf";
|
|
}
|
|
|
|
std::string headers()
|
|
{
|
|
return "#include <opencl_math>\n";
|
|
}
|
|
|
|
cl_double2 operator()(const cl_float& x)
|
|
{
|
|
cl_double2 r;
|
|
r.s[0] = (std::modf)(static_cast<cl_double>(x), &(r.s[1]));
|
|
return r;
|
|
}
|
|
|
|
cl_float min1()
|
|
{
|
|
return -1000.0f;
|
|
}
|
|
|
|
cl_float max1()
|
|
{
|
|
return 1000.0f;
|
|
}
|
|
|
|
std::vector<cl_float> in1_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
cl_float(2.0f),
|
|
cl_float(-2.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
bool use_ulp()
|
|
{
|
|
return true;
|
|
}
|
|
|
|
float ulp()
|
|
{
|
|
if(m_is_embedded)
|
|
{
|
|
return 0.0f;
|
|
}
|
|
return 0.0f;
|
|
}
|
|
private:
|
|
bool m_is_embedded;
|
|
};
|
|
|
|
// We need to specialize generate_kernel_unary<>() function template for fp_func_modf.
|
|
// -----------------------------------------------------------------------------------
|
|
// ------------- ONLY FOR OPENCL 22 CONFORMANCE TEST 22 DEVELOPMENT ------------------
|
|
// -----------------------------------------------------------------------------------
|
|
#if defined(DEVELOPMENT) && defined(USE_OPENCLC_KERNELS)
|
|
template <>
|
|
std::string generate_kernel_unary<fp_func_modf, cl_float, cl_float2>(fp_func_modf func)
|
|
{
|
|
return
|
|
"__kernel void test_modf(global float *input, global float2 *output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" float itpr = 0;\n"
|
|
" result.x = modf(input[gid], &itpr);\n"
|
|
" result.y = itpr;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#else
|
|
template <>
|
|
std::string generate_kernel_unary<fp_func_modf, cl_float, cl_float2>(fp_func_modf func)
|
|
{
|
|
return
|
|
"" + func.defs() +
|
|
"" + func.headers() +
|
|
"#include <opencl_memory>\n"
|
|
"#include <opencl_work_item>\n"
|
|
"using namespace cl;\n"
|
|
"__kernel void test_modf(global_ptr<float[]> input, global_ptr<float2[]> output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" float itpr = 0;\n"
|
|
" result.x = modf(input[gid], &itpr);\n"
|
|
" result.y = itpr;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#endif
|
|
|
|
// gentype frexp(gentype x, intn* exp);
|
|
//
|
|
// Fuction frexp() returns additional value via pointer (2nd argument). In order to test
|
|
// if it's correct output buffer type is cl_float2. In first compontent we store what
|
|
// modf() function returns, and in the 2nd component we store what is returned via its
|
|
// 2nd argument (intn* exp).
|
|
struct fp_func_frexp : public unary_func<cl_float, cl_float2>
|
|
{
|
|
fp_func_frexp(bool is_embedded) : m_is_embedded(is_embedded)
|
|
{
|
|
|
|
}
|
|
|
|
std::string str()
|
|
{
|
|
return "frexp";
|
|
}
|
|
|
|
std::string headers()
|
|
{
|
|
return "#include <opencl_math>\n";
|
|
}
|
|
|
|
cl_double2 operator()(const cl_float& x)
|
|
{
|
|
cl_double2 r;
|
|
cl_int e;
|
|
r.s[0] = (std::frexp)(static_cast<cl_double>(x), &e);
|
|
r.s[1] = static_cast<cl_float>(e);
|
|
return r;
|
|
}
|
|
|
|
cl_float min1()
|
|
{
|
|
return -1000.0f;
|
|
}
|
|
|
|
cl_float max1()
|
|
{
|
|
return 1000.0f;
|
|
}
|
|
|
|
std::vector<cl_float> in1_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
cl_float(2.0f),
|
|
cl_float(-2.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
bool use_ulp()
|
|
{
|
|
return true;
|
|
}
|
|
|
|
float ulp()
|
|
{
|
|
if(m_is_embedded)
|
|
{
|
|
return 0.0f;
|
|
}
|
|
return 0.0f;
|
|
}
|
|
private:
|
|
bool m_is_embedded;
|
|
};
|
|
|
|
// We need to specialize generate_kernel_unary<>() function template for fp_func_frexp.
|
|
// -----------------------------------------------------------------------------------
|
|
// ------------- ONLY FOR OPENCL 22 CONFORMANCE TEST 22 DEVELOPMENT ------------------
|
|
// -----------------------------------------------------------------------------------
|
|
#if defined(DEVELOPMENT) && defined(USE_OPENCLC_KERNELS)
|
|
template <>
|
|
std::string generate_kernel_unary<fp_func_frexp, cl_float, cl_float2>(fp_func_frexp func)
|
|
{
|
|
return
|
|
"__kernel void test_frexp(global float *input, global float2 *output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" int itpr = 0;\n"
|
|
" result.x = frexp(input[gid], &itpr);\n"
|
|
" result.y = itpr;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#else
|
|
template <>
|
|
std::string generate_kernel_unary<fp_func_frexp, cl_float, cl_float2>(fp_func_frexp func)
|
|
{
|
|
return
|
|
"" + func.defs() +
|
|
"" + func.headers() +
|
|
"#include <opencl_memory>\n"
|
|
"#include <opencl_work_item>\n"
|
|
"using namespace cl;\n"
|
|
"__kernel void test_frexp(global_ptr<float[]> input, global_ptr<float2[]> output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" int itpr = 0;\n"
|
|
" result.x = frexp(input[gid], &itpr);\n"
|
|
" result.y = itpr;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#endif
|
|
|
|
// -------------- BINARY FUNCTIONS
|
|
|
|
// gentype copysign(gentype x, gentype y);
|
|
// gentype fmod(gentype x, gentype y);
|
|
// gentype remainder(gentype x, gentype y);
|
|
// group_name, func_name, reference_func, use_ulp, ulp, ulp_for_embedded, max_delta, min1, max1, min2, max2
|
|
MATH_FUNCS_DEFINE_BINARY_FUNC(fp, copysign, std::copysign, true, 0.0f, 0.0f, 0.001f, -100.0f, 100.0f, -10.0f, 10.0f)
|
|
MATH_FUNCS_DEFINE_BINARY_FUNC(fp, fmod, std::fmod, true, 0.0f, 0.0f, 0.001f, -100.0f, 100.0f, -10.0f, 10.0f)
|
|
MATH_FUNCS_DEFINE_BINARY_FUNC(fp, remainder, std::remainder, true, 0.0f, 0.001f, 0.0f, -100.0f, 100.0f, -10.0f, 10.0f)
|
|
|
|
// In case of function float nextafter(float, float) reference function must
|
|
// operate on floats and return float.
|
|
struct fp_func_nextafter : public binary_func<cl_float, cl_float, cl_float>
|
|
{
|
|
fp_func_nextafter(bool is_embedded) : m_is_embedded(is_embedded)
|
|
{
|
|
|
|
}
|
|
|
|
std::string str()
|
|
{
|
|
return "nextafter";
|
|
}
|
|
|
|
std::string headers()
|
|
{
|
|
return "#include <opencl_math>\n";
|
|
}
|
|
|
|
/* In this case reference value type MUST BE cl_float */
|
|
cl_float operator()(const cl_float& x, const cl_float& y)
|
|
{
|
|
return (std::nextafter)(x, y);
|
|
}
|
|
|
|
cl_float min1()
|
|
{
|
|
return -1000.0f;
|
|
}
|
|
|
|
cl_float max1()
|
|
{
|
|
return 500.0f;
|
|
}
|
|
|
|
cl_float min2()
|
|
{
|
|
return 501.0f;
|
|
}
|
|
|
|
cl_float max2()
|
|
{
|
|
return 1000.0f;
|
|
}
|
|
|
|
std::vector<cl_float> in1_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
cl_float(2.0f),
|
|
cl_float(-2.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
std::vector<cl_float> in2_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
cl_float(2.0f),
|
|
cl_float(-2.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
bool use_ulp()
|
|
{
|
|
return true;
|
|
}
|
|
|
|
float ulp()
|
|
{
|
|
if(m_is_embedded)
|
|
{
|
|
return 0.0f;
|
|
}
|
|
return 0.0f;
|
|
}
|
|
private:
|
|
bool m_is_embedded;
|
|
};
|
|
|
|
// gentype remquo(gentype x, gentype y, intn* quo);
|
|
struct fp_func_remquo : public binary_func<cl_float, cl_float, cl_float2>
|
|
{
|
|
fp_func_remquo(bool is_embedded) : m_is_embedded(is_embedded)
|
|
{
|
|
|
|
}
|
|
|
|
std::string str()
|
|
{
|
|
return "remquo";
|
|
}
|
|
|
|
std::string headers()
|
|
{
|
|
return "#include <opencl_math>\n";
|
|
}
|
|
|
|
cl_double2 operator()(const cl_float& x, const cl_float& y)
|
|
{
|
|
return reference::remquo(static_cast<cl_double>(x), static_cast<cl_double>(y));
|
|
}
|
|
|
|
cl_float min1()
|
|
{
|
|
return -1000.0f;
|
|
}
|
|
|
|
cl_float max1()
|
|
{
|
|
return 1000.0f;
|
|
}
|
|
|
|
cl_float min2()
|
|
{
|
|
return -1000.0f;
|
|
}
|
|
|
|
cl_float max2()
|
|
{
|
|
return 1000.0f;
|
|
}
|
|
|
|
std::vector<cl_float> in1_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
std::vector<cl_float> in2_special_cases()
|
|
{
|
|
return {
|
|
cl_float(0.0f),
|
|
cl_float(-0.0f),
|
|
cl_float(1.0f),
|
|
cl_float(-1.0f),
|
|
std::numeric_limits<cl_float>::infinity(),
|
|
-std::numeric_limits<cl_float>::infinity(),
|
|
std::numeric_limits<cl_float>::quiet_NaN()
|
|
};
|
|
}
|
|
|
|
bool use_ulp()
|
|
{
|
|
return true;
|
|
}
|
|
|
|
float ulp()
|
|
{
|
|
if(m_is_embedded)
|
|
{
|
|
return 0.0f;
|
|
}
|
|
return 0.0f;
|
|
}
|
|
private:
|
|
bool m_is_embedded;
|
|
};
|
|
|
|
|
|
// We need to specialize generate_kernel_binary<>() function template for fp_func_remquo.
|
|
// -----------------------------------------------------------------------------------
|
|
// ------------- ONLY FOR OPENCL 22 CONFORMANCE TEST 22 DEVELOPMENT ------------------
|
|
// -----------------------------------------------------------------------------------
|
|
#if defined(DEVELOPMENT) && defined(USE_OPENCLC_KERNELS)
|
|
template <>
|
|
std::string generate_kernel_binary<fp_func_remquo, cl_float, cl_float, cl_float2>(fp_func_remquo func)
|
|
{
|
|
return
|
|
"__kernel void test_remquo(global float *input1, global float *input2, global float2 *output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" int quo = 0;\n"
|
|
" int sign = 0;\n"
|
|
" result.x = remquo(input1[gid], input2[gid], &quo);\n"
|
|
// Specification say:
|
|
// "remquo also calculates the lower seven bits of the integral quotient x/y,
|
|
// and gives that value the same sign as x/y. It stores this signed value in
|
|
// the object pointed to by quo."
|
|
// Implemenation may save into quo more than seven bits. We need to take
|
|
// care of that here.
|
|
" sign = (quo < 0) ? -1 : 1;\n"
|
|
" quo = (quo < 0) ? -quo : quo;\n"
|
|
" quo &= 0x0000007f;\n"
|
|
" result.y = (sign < 0) ? -quo : quo;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#else
|
|
template <>
|
|
std::string generate_kernel_binary<fp_func_remquo, cl_float, cl_float, cl_float2>(fp_func_remquo func)
|
|
{
|
|
return
|
|
"" + func.defs() +
|
|
"" + func.headers() +
|
|
"#include <opencl_memory>\n"
|
|
"#include <opencl_work_item>\n"
|
|
"using namespace cl;\n"
|
|
"__kernel void test_remquo(global_ptr<float[]> input1, global_ptr<float[]> input2, global_ptr<float2[]> output)\n"
|
|
"{\n"
|
|
" size_t gid = get_global_id(0);\n"
|
|
" float2 result;\n"
|
|
" int quo = 0;\n"
|
|
" int sign = 0;\n"
|
|
" result.x = remquo(input1[gid], input2[gid], &quo);\n"
|
|
// Specification say:
|
|
// "remquo also calculates the lower seven bits of the integral quotient x/y,
|
|
// and gives that value the same sign as x/y. It stores this signed value in
|
|
// the object pointed to by quo."
|
|
// Implemenation may save into quo more than seven bits. We need to take
|
|
// care of that here.
|
|
" sign = (quo < 0) ? -1 : 1;\n"
|
|
" quo = (quo < 0) ? -quo : quo;\n"
|
|
" quo &= 0x0000007f;\n"
|
|
" result.y = (sign < 0) ? -quo : quo;\n"
|
|
" output[gid] = result;\n"
|
|
"}\n";
|
|
}
|
|
#endif
|
|
|
|
// -------------- TERNARY FUNCTIONS
|
|
|
|
// gentype fma(gentype a, gentype b, gentype c);
|
|
// group_name, func_name, reference_func, use_ulp, ulp, ulp_for_embedded, max_delta, min1, max1, min2, max2, min3, max3
|
|
MATH_FUNCS_DEFINE_TERNARY_FUNC(fp, fma, std::fma, true, 0.0f, 0.0f, 0.001f, -1000.0f, 1000.0f, -1000.0f, 1000.0f, -1000.0f, 1000.0f)
|
|
|
|
// floating point functions
|
|
AUTO_TEST_CASE(test_fp_funcs)
|
|
(cl_device_id device, cl_context context, cl_command_queue queue, int n_elems)
|
|
{
|
|
int error = CL_SUCCESS;
|
|
int last_error = CL_SUCCESS;
|
|
|
|
// Check for EMBEDDED_PROFILE
|
|
bool is_embedded_profile = false;
|
|
char profile[128];
|
|
last_error = clGetDeviceInfo(device, CL_DEVICE_PROFILE, sizeof(profile), (void *)&profile, NULL);
|
|
RETURN_ON_CL_ERROR(last_error, "clGetDeviceInfo")
|
|
if (std::strcmp(profile, "EMBEDDED_PROFILE") == 0)
|
|
is_embedded_profile = true;
|
|
|
|
// gentype ceil(gentype x);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_ceil(is_embedded_profile)))
|
|
// gentype floor(gentype x);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_floor(is_embedded_profile)))
|
|
// gentype rint(gentype x);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_rint(is_embedded_profile)))
|
|
// gentype round(gentype x);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_round(is_embedded_profile)))
|
|
// gentype trunc(gentype x);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_trunc(is_embedded_profile)))
|
|
|
|
// floatn nan(uintn nancode);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_nan()))
|
|
|
|
// gentype fract(gentype x, gentype* iptr);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_fract(is_embedded_profile)))
|
|
// gentype modf(gentype x, gentype* iptr);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_modf(is_embedded_profile)))
|
|
// gentype frexp(gentype x, intn* exp);
|
|
TEST_UNARY_FUNC_MACRO((fp_func_frexp(is_embedded_profile)))
|
|
|
|
// gentype remainder(gentype x, gentype y);
|
|
TEST_BINARY_FUNC_MACRO((fp_func_remainder(is_embedded_profile)))
|
|
// gentype copysign(gentype x, gentype y);
|
|
TEST_BINARY_FUNC_MACRO((fp_func_copysign(is_embedded_profile)))
|
|
// gentype fmod(gentype x, gentype y);
|
|
TEST_BINARY_FUNC_MACRO((fp_func_fmod(is_embedded_profile)))
|
|
|
|
// gentype nextafter(gentype x, gentype y);
|
|
TEST_BINARY_FUNC_MACRO((fp_func_nextafter(is_embedded_profile)))
|
|
|
|
// gentype remquo(gentype x, gentype y, intn* quo);
|
|
TEST_BINARY_FUNC_MACRO((fp_func_remquo(is_embedded_profile)))
|
|
|
|
// gentype fma(gentype a, gentype b, gentype c);
|
|
TEST_TERNARY_FUNC_MACRO((fp_func_fma(is_embedded_profile)))
|
|
|
|
if(error != CL_SUCCESS)
|
|
{
|
|
return -1;
|
|
}
|
|
return error;
|
|
}
|
|
|
|
#endif // TEST_CONFORMANCE_CLCPP_MATH_FUNCS_FP_FUNCS_HPP
|