2020-02-08 23:01:28 +00:00
|
|
|
/*
|
|
|
|
* Copyright 2011-2016 Blender Foundation
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "testing/testing.h"
|
|
|
|
#include "util/util_system.h"
|
2020-03-19 08:33:03 +00:00
|
|
|
#include "util/util_types.h"
|
2020-02-08 23:01:28 +00:00
|
|
|
|
|
|
|
CCL_NAMESPACE_BEGIN
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* Report whether the CPU running the tests supports the instruction set
 * selected at compile time.
 *
 * Returns the result of system_cpu_support_avx2() when __KERNEL_AVX2__ is
 * defined, otherwise the result of system_cpu_support_avx() when
 * __KERNEL_AVX__ is defined. When neither macro is defined there is nothing
 * to validate, so false is returned; previously control fell off the end of
 * this non-void function in that configuration, which is undefined
 * behaviour. */
static bool validate_cpu_capabilities()
{
#if defined(__KERNEL_AVX2__)
  return system_cpu_support_avx2();
#elif defined(__KERNEL_AVX__)
  return system_cpu_support_avx();
#else
  /* No AVX kernel flavour selected: report "unsupported" so that callers
   * skip their work instead of reading an indeterminate return value. */
  return false;
#endif
}
|
|
|
|
|
2020-02-11 07:45:08 +00:00
|
|
|
/* Guard placed at the top of a test body: returns from the enclosing function
 * when validate_cpu_capabilities() reports false, so the remaining statements
 * are not executed.
 *
 * Deliberately not wrapped in do { } while (0): the call sites in this file
 * write the macro without a trailing semicolon. */
#define VALIDATECPU \
  if (!validate_cpu_capabilities()) { \
    return; \
  }
|
2020-02-08 23:01:28 +00:00
|
|
|
|
2020-02-11 07:45:08 +00:00
|
|
|
/* Expect every element of vector `a` to equal the scalar expression `b`
 * (checked with EXPECT_FLOAT_EQ).
 *
 * `a` must expose a `size` member and be indexable with []. Both arguments
 * are substituted textually and evaluated on every iteration, so they should
 * be free of side effects. Because `b` is expanded inside the loop it may
 * refer to the loop counter `index`; the constructor test in this file relies
 * on that, so the counter must keep this exact name.
 *
 * Arguments are parenthesized so compound expressions bind as intended, and
 * the loop body is braced so the expansion stays a single statement. */
#define compare_vector_scalar(a, b) \
  for (size_t index = 0; index < (a).size; index++) { \
    EXPECT_FLOAT_EQ((a)[index], (b)); \
  }
|
2020-02-08 23:01:28 +00:00
|
|
|
|
2020-02-11 07:45:08 +00:00
|
|
|
/* Expect `a` and `b` to match element by element (checked with
 * EXPECT_FLOAT_EQ).
 *
 * The element count is taken from `a.size`; `b` only needs to be indexable
 * with [] for that many elements (a plain array works). Both arguments are
 * substituted textually and evaluated on every iteration, so they should be
 * free of side effects.
 *
 * Arguments are parenthesized so compound expressions bind as intended, and
 * the loop body is braced so the expansion stays a single statement. */
#define compare_vector_vector(a, b) \
  for (size_t index = 0; index < (a).size; index++) { \
    EXPECT_FLOAT_EQ((a)[index], (b)[index]); \
  }
|
2020-02-08 23:01:28 +00:00
|
|
|
|
2020-02-18 13:42:35 +00:00
|
|
|
/* Expect `a` and `b` to match element by element within the absolute
 * tolerance `abserror` (checked with EXPECT_NEAR).
 *
 * The element count is taken from `a.size`; `b` only needs to be indexable
 * with [] for that many elements. All arguments are substituted textually and
 * evaluated on every iteration, so they should be free of side effects.
 *
 * Arguments are parenthesized so compound expressions bind as intended, and
 * the loop body is braced so the expansion stays a single statement. */
#define compare_vector_vector_near(a, b, abserror) \
  for (size_t index = 0; index < (a).size; index++) { \
    EXPECT_NEAR((a)[index], (b)[index], (abserror)); \
  }
|
|
|
|
|
2020-02-11 07:45:08 +00:00
|
|
|
/* Body of a "vector op vector" test.
 *
 * Skips the test via VALIDATECPU when the CPU check fails, evaluates
 * `a op b` once as an avxf, then expects every element of the result to equal
 * the same operator applied to the matching scalar elements of `a` and `b`.
 *
 * `op` is a bare binary operator token (for example +). The expansion
 * declares a local named `c` in the enclosing scope, so it can be used at
 * most once per scope. `a` and `b` are parenthesized so compound expressions
 * bind as intended; `op` cannot be. */
#define basic_test_vv(a, b, op) \
  VALIDATECPU \
  avxf c = (a) op (b); \
  for (size_t i = 0; i < (a).size; i++) { \
    EXPECT_FLOAT_EQ(c[i], (a)[i] op (b)[i]); \
  }
|
2020-02-08 23:01:28 +00:00
|
|
|
|
|
|
|
/* Body of a "vector op float" test.
 *
 * Skips the test via VALIDATECPU when the CPU check fails, evaluates
 * `a op b` once as an avxf (with `b` a scalar), then expects every element of
 * the result to equal the same operator applied to the matching element of
 * `a` and the scalar `b`.
 *
 * `op` is a bare binary operator token (for example +). The expansion
 * declares a local named `c` in the enclosing scope, so it can be used at
 * most once per scope. `a` and `b` are parenthesized so compound expressions
 * bind as intended; `op` cannot be. */
#define basic_test_vf(a, b, op) \
  VALIDATECPU \
  avxf c = (a) op (b); \
  for (size_t i = 0; i < (a).size; i++) { \
    EXPECT_FLOAT_EQ(c[i], (a)[i] op (b)); \
  }
|
2020-02-08 23:01:28 +00:00
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* Operands shared by the tests in this file.
 *
 * Note on ordering: the constructor test in this file expects the LAST
 * argument of the eight-float constructor to be readable at index 0, so the
 * literals below appear from index 7 down to index 0. */
static const avxf avxf_a = avxf(0.1f, 0.2f, 0.3f, 0.4f, 0.5f, 0.6f, 0.7f, 0.8f);
static const avxf avxf_b = avxf(1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f);
static const avxf avxf_c = avxf(1.1f, 2.2f, 3.3f, 4.4f, 5.5f, 6.6f, 7.7f, 8.8f);

/* Scalar right-hand operand for the "vector op float" tests. */
static const float float_b = 1.5f;
|
|
|
|
|
|
|
|
/* Element-wise arithmetic, vector (op) vector.
 *
 * Each macro call is followed by a semicolon (a harmless empty statement) so
 * that every test reads as an ordinary statement and stays on its own lines. */
TEST(TEST_CATEGORY_NAME, avxf_add_vv)
{
  basic_test_vv(avxf_a, avxf_b, +);
}

TEST(TEST_CATEGORY_NAME, avxf_sub_vv)
{
  basic_test_vv(avxf_a, avxf_b, -);
}

TEST(TEST_CATEGORY_NAME, avxf_mul_vv)
{
  basic_test_vv(avxf_a, avxf_b, *);
}

TEST(TEST_CATEGORY_NAME, avxf_div_vv)
{
  basic_test_vv(avxf_a, avxf_b, /);
}

/* Element-wise arithmetic, vector (op) scalar float. */
TEST(TEST_CATEGORY_NAME, avxf_add_vf)
{
  basic_test_vf(avxf_a, float_b, +);
}

TEST(TEST_CATEGORY_NAME, avxf_sub_vf)
{
  basic_test_vf(avxf_a, float_b, -);
}

TEST(TEST_CATEGORY_NAME, avxf_mul_vf)
{
  basic_test_vf(avxf_a, float_b, *);
}

TEST(TEST_CATEGORY_NAME, avxf_div_vf)
{
  basic_test_vf(avxf_a, float_b, /);
}
|
2020-02-08 23:01:28 +00:00
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* Checks the element layout produced by each avxf constructor used here. */
TEST(TEST_CATEGORY_NAME, avxf_ctor)
{
  VALIDATECPU

  /* Eight floats: element i is expected to equal float(i), i.e. the last
   * argument ends up at index 0. `index` is the loop counter declared inside
   * compare_vector_scalar. */
  const avxf eight_floats(7.0f, 6.0f, 5.0f, 4.0f, 3.0f, 2.0f, 1.0f, 0.0f);
  compare_vector_scalar(eight_floats, static_cast<float>(index));

  /* One float: every element is expected to hold that value. */
  const avxf one_float(1.0f);
  compare_vector_scalar(one_float, 1.0f);

  /* Two floats: expected to match four copies of the first followed by four
   * copies of the second, in constructor-argument order. */
  const avxf two_floats(1.0f, 2.0f);
  const avxf two_floats_expected(1.0f, 1.0f, 1.0f, 1.0f, 2.0f, 2.0f, 2.0f, 2.0f);
  compare_vector_vector(two_floats, two_floats_expected);

  /* Four floats: expected to match the same four values repeated twice. */
  const avxf four_floats(1.0f, 2.0f, 3.0f, 4.0f);
  const avxf four_floats_expected(1.0f, 2.0f, 3.0f, 4.0f, 1.0f, 2.0f, 3.0f, 4.0f);
  compare_vector_vector(four_floats, four_floats_expected);

  /* float3: expected to match (0, 3, 2, 1) repeated twice. */
  const avxf from_float3(make_float3(1.0f, 2.0f, 3.0f));
  const avxf from_float3_expected(0.0f, 3.0f, 2.0f, 1.0f, 0.0f, 3.0f, 2.0f, 1.0f);
  compare_vector_vector(from_float3, from_float3_expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* mm256_sqrt on the perfect squares 1..64 is expected to give 1..8. */
TEST(TEST_CATEGORY_NAME, avxf_sqrt)
{
  VALIDATECPU

  const avxf squares(1.0f, 4.0f, 9.0f, 16.0f, 25.0f, 36.0f, 49.0f, 64.0f);
  const avxf expected_roots(1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f);

  const avxf roots = mm256_sqrt(squares);
  compare_vector_vector(roots, expected_roots);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* Every literal in avxf_a is smaller than its counterpart in avxf_b, so
 * min() is expected to reproduce avxf_a and max() to reproduce avxf_b. */
TEST(TEST_CATEGORY_NAME, avxf_min_max)
{
  VALIDATECPU

  const avxf smaller = min(avxf_a, avxf_b);
  compare_vector_vector(smaller, avxf_a);

  const avxf larger = max(avxf_a, avxf_b);
  compare_vector_vector(larger, avxf_b);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* With only the first template flag of set_sign_bit set, the result is
 * expected to equal avxf_a except that the last-listed element (0.8f) comes
 * back negated. */
TEST(TEST_CATEGORY_NAME, avxf_set_sign)
{
  VALIDATECPU

  const avxf expected(0.1f, 0.2f, 0.3f, 0.4f, 0.5f, 0.6f, 0.7f, -0.8f);
  const avxf flipped = set_sign_bit<1, 0, 0, 0, 0, 0, 0, 0>(avxf_a);
  compare_vector_vector(flipped, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* msub(a, b, c) is expected to equal (a * b) - c for every element. */
TEST(TEST_CATEGORY_NAME, avxf_msub)
{
  VALIDATECPU

  /* Scalar reference values, listed from index 7 down to index 0 to follow
   * the argument order of the eight-float constructor. */
  const avxf expected = avxf((avxf_a[7] * avxf_b[7]) - avxf_c[7],
                             (avxf_a[6] * avxf_b[6]) - avxf_c[6],
                             (avxf_a[5] * avxf_b[5]) - avxf_c[5],
                             (avxf_a[4] * avxf_b[4]) - avxf_c[4],
                             (avxf_a[3] * avxf_b[3]) - avxf_c[3],
                             (avxf_a[2] * avxf_b[2]) - avxf_c[2],
                             (avxf_a[1] * avxf_b[1]) - avxf_c[1],
                             (avxf_a[0] * avxf_b[0]) - avxf_c[0]);

  const avxf actual = msub(avxf_a, avxf_b, avxf_c);
  compare_vector_vector(actual, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* madd(a, b, c) is expected to equal (a * b) + c for every element. */
TEST(TEST_CATEGORY_NAME, avxf_madd)
{
  VALIDATECPU

  /* Scalar reference values, listed from index 7 down to index 0 to follow
   * the argument order of the eight-float constructor. */
  const avxf expected = avxf((avxf_a[7] * avxf_b[7]) + avxf_c[7],
                             (avxf_a[6] * avxf_b[6]) + avxf_c[6],
                             (avxf_a[5] * avxf_b[5]) + avxf_c[5],
                             (avxf_a[4] * avxf_b[4]) + avxf_c[4],
                             (avxf_a[3] * avxf_b[3]) + avxf_c[3],
                             (avxf_a[2] * avxf_b[2]) + avxf_c[2],
                             (avxf_a[1] * avxf_b[1]) + avxf_c[1],
                             (avxf_a[0] * avxf_b[0]) + avxf_c[0]);

  const avxf actual = madd(avxf_a, avxf_b, avxf_c);
  compare_vector_vector(actual, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* nmadd(a, b, c) is expected to equal c - (a * b) for every element. */
TEST(TEST_CATEGORY_NAME, avxf_nmadd)
{
  VALIDATECPU

  /* Scalar reference values, listed from index 7 down to index 0 to follow
   * the argument order of the eight-float constructor. */
  const avxf expected = avxf(avxf_c[7] - (avxf_a[7] * avxf_b[7]),
                             avxf_c[6] - (avxf_a[6] * avxf_b[6]),
                             avxf_c[5] - (avxf_a[5] * avxf_b[5]),
                             avxf_c[4] - (avxf_a[4] * avxf_b[4]),
                             avxf_c[3] - (avxf_a[3] * avxf_b[3]),
                             avxf_c[2] - (avxf_a[2] * avxf_b[2]),
                             avxf_c[1] - (avxf_a[1] * avxf_b[1]),
                             avxf_c[0] - (avxf_a[0] * avxf_b[0]));

  const avxf actual = nmadd(avxf_a, avxf_b, avxf_c);
  compare_vector_vector(actual, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* Element-wise `<=` between two avxf values is expected to produce -1 where
 * the comparison holds and 0 where it does not. */
TEST(TEST_CATEGORY_NAME, avxf_compare)
{
  VALIDATECPU

  const avxf lhs(0.0f, 1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f);
  const avxf rhs(7.0f, 6.0f, 5.0f, 4.0f, 3.0f, 2.0f, 1.0f, 0.0f);

  /* NOTE(review): `mask` is intentionally left non-const. The expected values
   * are -1 / 0, which presumably relies on how a mutable avxb is indexed;
   * confirm against the avxb definition before adding const here. */
  avxb mask = lhs <= rhs;

  /* Scalar reference: one entry per element, -1 when lhs <= rhs, else 0. */
  int expected[8];
  for (size_t lane = 0; lane < 8; lane++) {
    expected[lane] = (lhs[lane] <= rhs[lane]) ? -1 : 0;
  }

  compare_vector_vector(mask, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* permute<3, 0, 1, 7, 6, 5, 2, 4> applied to avxf_b is expected to produce
 * the reordering spelled out in `expected` below. */
TEST(TEST_CATEGORY_NAME, avxf_permute)
{
  VALIDATECPU

  const avxf expected(4.0f, 6.0f, 3.0f, 2.0f, 1.0f, 7.0f, 8.0f, 5.0f);
  const avxf permuted = permute<3, 0, 1, 7, 6, 5, 2, 4>(avxf_b);
  compare_vector_vector(permuted, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* blend<...>(avxf_a, avxf_b): read position by position against the
 * constructor arguments of `expected`, a 0 flag lines up with a value from
 * avxf_a and a 1 flag with a value from avxf_b. */
TEST(TEST_CATEGORY_NAME, avxf_blend)
{
  VALIDATECPU

  const avxf expected(0.1f, 0.2f, 3.0f, 0.4f, 5.0f, 0.6f, 7.0f, 0.8f);
  const avxf blended = blend<0, 0, 1, 0, 1, 0, 1, 0>(avxf_a, avxf_b);
  compare_vector_vector(blended, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* shuffle<0, 1, 2, 3, 1, 3, 2, 0> applied to avxf_a is expected to produce
 * the reordering spelled out in `expected` below. */
TEST(TEST_CATEGORY_NAME, avxf_shuffle)
{
  VALIDATECPU

  const avxf expected(0.4f, 0.2f, 0.1f, 0.3f, 0.5f, 0.6f, 0.7f, 0.8f);
  const avxf shuffled = shuffle<0, 1, 2, 3, 1, 3, 2, 0>(avxf_a);
  compare_vector_vector(shuffled, expected);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* cross(avxf_b, avxf_c) compared against reference values with an absolute
 * tolerance instead of the ULP-based float comparison.
 *
 * NOTE(review): every literal of avxf_c is 1.1 times its counterpart in
 * avxf_b, so the tiny reference values below are presumably rounding residue
 * around zero - confirm before tightening the tolerance. */
TEST(TEST_CATEGORY_NAME, avxf_cross)
{
  VALIDATECPU

  const avxf expected(0.0f,
                      -9.5367432e-07f,
                      0.0f,
                      4.7683716e-07f,
                      0.0f,
                      -3.8146973e-06f,
                      3.8146973e-06f,
                      3.8146973e-06f);
  const float tolerance = 0.000002000f;

  const avxf actual = cross(avxf_b, avxf_c);
  compare_vector_vector_near(actual, expected, tolerance);
}
|
|
|
|
|
2020-09-15 09:16:35 +00:00
|
|
|
/* dot3(avxf_a, avxf_b, out1, out2) writes two scalar results.
 *
 * The expected numbers correspond to three-element dot products of the test
 * operands: 14.9 = 0.6 * 6 + 0.7 * 7 + 0.8 * 8 and
 * 2.9 = 0.2 * 2 + 0.3 * 3 + 0.4 * 4. */
TEST(TEST_CATEGORY_NAME, avxf_dot3)
{
  VALIDATECPU

  /* Output arguments; both are filled in by dot3(). */
  float first_dot;
  float second_dot;
  dot3(avxf_a, avxf_b, first_dot, second_dot);

  EXPECT_FLOAT_EQ(first_dot, 14.9f);
  EXPECT_FLOAT_EQ(second_dot, 2.9f);
}
|
|
|
|
|
|
|
|
CCL_NAMESPACE_END
|