blob: 59f747dfc06ffe9973a0215b4021a2366ca68ae4 [file] [log] [blame] [edit]
// Copyright 2016 The SwiftShader Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "Coroutine.hpp"
#include "Print.hpp"
#include "Reactor.hpp"
#include "gtest/gtest.h"
#include <array>
#include <cmath>
#include <thread>
#include <tuple>
using namespace rr;
int reference(int *p, int y)
{
int x = p[-1];
int z = 4;
for(int i = 0; i < 10; i++)
{
z += (2 << i) - (i / 3);
}
int sum = x + y + z;
return sum;
}
TEST(ReactorUnitTests, Sample)
{
FunctionT<int(int *, int)> function;
{
Pointer<Int> p = function.Arg<0>();
Int x = p[-1];
Int y = function.Arg<1>();
Int z = 4;
For(Int i = 0, i < 10, i++)
{
z += (2 << i) - (i / 3);
}
Float4 v;
v.z = As<Float>(z);
z = As<Int>(Float(Float4(v.xzxx).y));
Int sum = x + y + z;
Return(sum);
}
auto routine = function("one");
int one[2] = { 1, 0 };
int result = routine(&one[1], 2);
EXPECT_EQ(result, reference(&one[1], 2));
}
TEST(ReactorUnitTests, Uninitialized)
{
FunctionT<int()> function;
{
Int a;
Int z = 4;
Int q;
Int c;
Int p;
Bool b;
q += q;
If(b)
{
c = p;
}
Return(a + z + q + c);
}
auto routine = function("one");
int result = routine();
EXPECT_EQ(result, result); // Anything is fine, just don't crash
}
TEST(ReactorUnitTests, Unreachable)
{
FunctionT<int(int)> function;
{
Int a = function.Arg<0>();
Int z = 4;
Return(a + z);
// Code beyond this point is unreachable but should not cause any
// compilation issues.
z += a;
}
auto routine = function("one");
int result = routine(16);
EXPECT_EQ(result, 20);
}
TEST(ReactorUnitTests, VariableAddress)
{
FunctionT<int(int)> function;
{
Int a = function.Arg<0>();
Int z = 0;
Pointer<Int> p = &z;
*p = 4;
Return(a + z);
}
auto routine = function("one");
int result = routine(16);
EXPECT_EQ(result, 20);
}
TEST(ReactorUnitTests, SubVectorLoadStore)
{
FunctionT<int(void *, void *)> function;
{
Pointer<Byte> in = function.Arg<0>();
Pointer<Byte> out = function.Arg<1>();
*Pointer<Int4>(out + 16 * 0) = *Pointer<Int4>(in + 16 * 0);
*Pointer<Short4>(out + 16 * 1) = *Pointer<Short4>(in + 16 * 1);
*Pointer<Byte8>(out + 16 * 2) = *Pointer<Byte8>(in + 16 * 2);
*Pointer<Byte4>(out + 16 * 3) = *Pointer<Byte4>(in + 16 * 3);
*Pointer<Short2>(out + 16 * 4) = *Pointer<Short2>(in + 16 * 4);
Return(0);
}
auto routine = function("one");
int8_t in[16 * 5] = { 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16,
17, 18, 19, 20, 21, 22, 23, 24, 0, 0, 0, 0, 0, 0, 0, 0,
25, 26, 27, 28, 29, 30, 31, 32, 0, 0, 0, 0, 0, 0, 0, 0,
33, 34, 35, 36, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
37, 38, 39, 40, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
int8_t out[16 * 5] = { -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 };
routine(in, out);
for(int row = 0; row < 5; row++)
{
for(int col = 0; col < 16; col++)
{
int i = row * 16 + col;
if(in[i] == 0)
{
EXPECT_EQ(out[i], -1) << "Row " << row << " column " << col << " not left untouched.";
}
else
{
EXPECT_EQ(out[i], in[i]) << "Row " << row << " column " << col << " not equal to input.";
}
}
}
}
TEST(ReactorUnitTests, VectorConstant)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Int4>(out + 16 * 0) = Int4(0x04030201, 0x08070605, 0x0C0B0A09, 0x100F0E0D);
*Pointer<Short4>(out + 16 * 1) = Short4(0x1211, 0x1413, 0x1615, 0x1817);
*Pointer<Byte8>(out + 16 * 2) = Byte8(0x19, 0x1A, 0x1B, 0x1C, 0x1D, 0x1E, 0x1F, 0x20);
*Pointer<Int2>(out + 16 * 3) = Int2(0x24232221, 0x28272625);
Return(0);
}
auto routine = function("one");
int8_t out[16 * 4] = { -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 };
int8_t exp[16 * 4] = { 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16,
17, 18, 19, 20, 21, 22, 23, 24, -1, -1, -1, -1, -1, -1, -1, -1,
25, 26, 27, 28, 29, 30, 31, 32, -1, -1, -1, -1, -1, -1, -1, -1,
33, 34, 35, 36, 37, 38, 39, 40, -1, -1, -1, -1, -1, -1, -1, -1 };
routine(out);
for(int row = 0; row < 4; row++)
{
for(int col = 0; col < 16; col++)
{
int i = row * 16 + col;
EXPECT_EQ(out[i], exp[i]);
}
}
}
TEST(ReactorUnitTests, Concatenate)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Int4>(out + 16 * 0) = Int4(Int2(0x04030201, 0x08070605), Int2(0x0C0B0A09, 0x100F0E0D));
*Pointer<Short8>(out + 16 * 1) = Short8(Short4(0x0201, 0x0403, 0x0605, 0x0807), Short4(0x0A09, 0x0C0B, 0x0E0D, 0x100F));
Return(0);
}
auto routine = function("one");
int8_t ref[16 * 5] = { 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16,
1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16 };
int8_t out[16 * 5] = { -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,
-1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1 };
routine(out);
for(int row = 0; row < 2; row++)
{
for(int col = 0; col < 16; col++)
{
int i = row * 16 + col;
EXPECT_EQ(out[i], ref[i]) << "Row " << row << " column " << col << " not equal to reference.";
}
}
}
TEST(ReactorUnitTests, Cast)
{
FunctionT<void(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
Int4 c = Int4(0x01020304, 0x05060708, 0x09101112, 0x13141516);
*Pointer<Short4>(out + 16 * 0) = Short4(c);
*Pointer<Byte4>(out + 16 * 1 + 0) = Byte4(c);
*Pointer<Byte4>(out + 16 * 1 + 4) = Byte4(As<Byte8>(c));
*Pointer<Byte4>(out + 16 * 1 + 8) = Byte4(As<Short4>(c));
}
auto routine = function("one");
int out[2][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x07080304);
EXPECT_EQ(out[0][1], 0x15161112);
EXPECT_EQ(out[1][0], 0x16120804);
EXPECT_EQ(out[1][1], 0x01020304);
EXPECT_EQ(out[1][2], 0x06080204);
}
static uint16_t swizzleCode4(int i)
{
auto x = (i >> 0) & 0x03;
auto y = (i >> 2) & 0x03;
auto z = (i >> 4) & 0x03;
auto w = (i >> 6) & 0x03;
return static_cast<uint16_t>((x << 12) | (y << 8) | (z << 4) | (w << 0));
}
TEST(ReactorUnitTests, Swizzle4)
{
FunctionT<void(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
for(int i = 0; i < 256; i++)
{
*Pointer<Float4>(out + 16 * i) = Swizzle(Float4(1.0f, 2.0f, 3.0f, 4.0f), swizzleCode4(i));
}
for(int i = 0; i < 256; i++)
{
*Pointer<Float4>(out + 16 * (256 + i)) = ShuffleLowHigh(Float4(1.0f, 2.0f, 3.0f, 4.0f), Float4(5.0f, 6.0f, 7.0f, 8.0f), swizzleCode4(i));
}
*Pointer<Float4>(out + 16 * (512 + 0)) = UnpackLow(Float4(1.0f, 2.0f, 3.0f, 4.0f), Float4(5.0f, 6.0f, 7.0f, 8.0f));
*Pointer<Float4>(out + 16 * (512 + 1)) = UnpackHigh(Float4(1.0f, 2.0f, 3.0f, 4.0f), Float4(5.0f, 6.0f, 7.0f, 8.0f));
*Pointer<Int2>(out + 16 * (512 + 2)) = UnpackLow(Short4(1, 2, 3, 4), Short4(5, 6, 7, 8));
*Pointer<Int2>(out + 16 * (512 + 3)) = UnpackHigh(Short4(1, 2, 3, 4), Short4(5, 6, 7, 8));
*Pointer<Short4>(out + 16 * (512 + 4)) = UnpackLow(Byte8(1, 2, 3, 4, 5, 6, 7, 8), Byte8(9, 10, 11, 12, 13, 14, 15, 16));
*Pointer<Short4>(out + 16 * (512 + 5)) = UnpackHigh(Byte8(1, 2, 3, 4, 5, 6, 7, 8), Byte8(9, 10, 11, 12, 13, 14, 15, 16));
for(int i = 0; i < 256; i++)
{
*Pointer<Short4>(out + 16 * (512 + 6) + (8 * i)) =
Swizzle(Short4(1, 2, 3, 4), swizzleCode4(i));
}
for(int i = 0; i < 256; i++)
{
*Pointer<Int4>(out + 16 * (512 + 6 + i) + (8 * 256)) =
Swizzle(Int4(1, 2, 3, 4), swizzleCode4(i));
}
}
auto routine = function("one");
struct
{
float f[256 + 256 + 2][4];
int i[388][4];
} out;
memset(&out, 0, sizeof(out));
routine(&out);
for(int i = 0; i < 256; i++)
{
EXPECT_EQ(out.f[i][0], float((i >> 0) & 0x03) + 1.0f);
EXPECT_EQ(out.f[i][1], float((i >> 2) & 0x03) + 1.0f);
EXPECT_EQ(out.f[i][2], float((i >> 4) & 0x03) + 1.0f);
EXPECT_EQ(out.f[i][3], float((i >> 6) & 0x03) + 1.0f);
}
for(int i = 0; i < 256; i++)
{
EXPECT_EQ(out.f[256 + i][0], float((i >> 0) & 0x03) + 1.0f);
EXPECT_EQ(out.f[256 + i][1], float((i >> 2) & 0x03) + 1.0f);
EXPECT_EQ(out.f[256 + i][2], float((i >> 4) & 0x03) + 5.0f);
EXPECT_EQ(out.f[256 + i][3], float((i >> 6) & 0x03) + 5.0f);
}
EXPECT_EQ(out.f[512 + 0][0], 1.0f);
EXPECT_EQ(out.f[512 + 0][1], 5.0f);
EXPECT_EQ(out.f[512 + 0][2], 2.0f);
EXPECT_EQ(out.f[512 + 0][3], 6.0f);
EXPECT_EQ(out.f[512 + 1][0], 3.0f);
EXPECT_EQ(out.f[512 + 1][1], 7.0f);
EXPECT_EQ(out.f[512 + 1][2], 4.0f);
EXPECT_EQ(out.f[512 + 1][3], 8.0f);
EXPECT_EQ(out.i[0][0], 0x00050001);
EXPECT_EQ(out.i[0][1], 0x00060002);
EXPECT_EQ(out.i[0][2], 0x00000000);
EXPECT_EQ(out.i[0][3], 0x00000000);
EXPECT_EQ(out.i[1][0], 0x00070003);
EXPECT_EQ(out.i[1][1], 0x00080004);
EXPECT_EQ(out.i[1][2], 0x00000000);
EXPECT_EQ(out.i[1][3], 0x00000000);
EXPECT_EQ(out.i[2][0], 0x0A020901);
EXPECT_EQ(out.i[2][1], 0x0C040B03);
EXPECT_EQ(out.i[2][2], 0x00000000);
EXPECT_EQ(out.i[2][3], 0x00000000);
EXPECT_EQ(out.i[3][0], 0x0E060D05);
EXPECT_EQ(out.i[3][1], 0x10080F07);
EXPECT_EQ(out.i[3][2], 0x00000000);
EXPECT_EQ(out.i[3][3], 0x00000000);
for(int i = 0; i < 256; i++)
{
EXPECT_EQ(out.i[4 + i / 2][0 + (i % 2) * 2] & 0xFFFF,
((i >> 0) & 0x03) + 1);
EXPECT_EQ(out.i[4 + i / 2][0 + (i % 2) * 2] >> 16,
((i >> 2) & 0x03) + 1);
EXPECT_EQ(out.i[4 + i / 2][1 + (i % 2) * 2] & 0xFFFF,
((i >> 4) & 0x03) + 1);
EXPECT_EQ(out.i[4 + i / 2][1 + (i % 2) * 2] >> 16,
((i >> 6) & 0x03) + 1);
}
for(int i = 0; i < 256; i++)
{
EXPECT_EQ(out.i[132 + i][0], ((i >> 0) & 0x03) + 1);
EXPECT_EQ(out.i[132 + i][1], ((i >> 2) & 0x03) + 1);
EXPECT_EQ(out.i[132 + i][2], ((i >> 4) & 0x03) + 1);
EXPECT_EQ(out.i[132 + i][3], ((i >> 6) & 0x03) + 1);
}
}
TEST(ReactorUnitTests, Swizzle)
{
FunctionT<void(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
Int4 c = Int4(0x01020304, 0x05060708, 0x09101112, 0x13141516);
*Pointer<Byte16>(out + 16 * 0) = Swizzle(As<Byte16>(c), 0xFEDCBA9876543210ull);
*Pointer<Byte8>(out + 16 * 1) = Swizzle(As<Byte8>(c), 0x76543210u);
*Pointer<UShort8>(out + 16 * 2) = Swizzle(As<UShort8>(c), 0x76543210u);
}
auto routine = function("one");
int out[3][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x16151413);
EXPECT_EQ(out[0][1], 0x12111009);
EXPECT_EQ(out[0][2], 0x08070605);
EXPECT_EQ(out[0][3], 0x04030201);
EXPECT_EQ(out[1][0], 0x08070605);
EXPECT_EQ(out[1][1], 0x04030201);
EXPECT_EQ(out[2][0], 0x15161314);
EXPECT_EQ(out[2][1], 0x11120910);
EXPECT_EQ(out[2][2], 0x07080506);
EXPECT_EQ(out[2][3], 0x03040102);
}
TEST(ReactorUnitTests, Shuffle)
{
// |select| is [0aaa:0bbb:0ccc:0ddd] where |aaa|, |bbb|, |ccc|
// and |ddd| are 7-bit selection indices. For a total (1 << 12)
// possibilities.
const int kSelectRange = 1 << 12;
// Unfortunately, testing the whole kSelectRange results in a test
// that is far too slow to run, because LLVM spends exponentially more
// time optimizing the function below as the number of test cases
// increases.
//
// To work-around the problem, only test a subset of the range by
// skipping every kRangeIncrement value.
//
// Set this value to 1 if you want to test the whole implementation,
// which will take a little less than 2 minutes on a fast workstation.
//
// The default value here takes about 1390ms, which is a little more than
// what the Swizzle test takes (993 ms) on my machine. A non-power-of-2
// value ensures a better spread over possible values.
const int kRangeIncrement = 11;
auto rangeIndexToSelect = [](int i) {
return static_cast<unsigned short>(
(((i >> 9) & 7) << 0) |
(((i >> 6) & 7) << 4) |
(((i >> 3) & 7) << 8) |
(((i >> 0) & 7) << 12));
};
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
for(int i = 0; i < kSelectRange; i += kRangeIncrement)
{
unsigned short select = rangeIndexToSelect(i);
*Pointer<Float4>(out + 16 * i) = Shuffle(Float4(1.0f, 2.0f, 3.0f, 4.0f),
Float4(5.0f, 6.0f, 7.0f, 8.0f),
select);
*Pointer<Int4>(out + (kSelectRange + i) * 16) = Shuffle(Int4(10, 11, 12, 13),
Int4(14, 15, 16, 17),
select);
*Pointer<UInt4>(out + (2 * kSelectRange + i) * 16) = Shuffle(UInt4(100, 101, 102, 103),
UInt4(104, 105, 106, 107),
select);
}
Return(0);
}
auto routine = function("one");
struct
{
float f[kSelectRange][4];
int i[kSelectRange][4];
unsigned u[kSelectRange][4];
} out;
memset(&out, 0, sizeof(out));
routine(&out);
for(int i = 0; i < kSelectRange; i += kRangeIncrement)
{
EXPECT_EQ(out.f[i][0], float(1.0f + (i & 7)));
EXPECT_EQ(out.f[i][1], float(1.0f + ((i >> 3) & 7)));
EXPECT_EQ(out.f[i][2], float(1.0f + ((i >> 6) & 7)));
EXPECT_EQ(out.f[i][3], float(1.0f + ((i >> 9) & 7)));
}
for(int i = 0; i < kSelectRange; i += kRangeIncrement)
{
EXPECT_EQ(out.i[i][0], int(10 + (i & 7)));
EXPECT_EQ(out.i[i][1], int(10 + ((i >> 3) & 7)));
EXPECT_EQ(out.i[i][2], int(10 + ((i >> 6) & 7)));
EXPECT_EQ(out.i[i][3], int(10 + ((i >> 9) & 7)));
}
for(int i = 0; i < kSelectRange; i += kRangeIncrement)
{
EXPECT_EQ(out.u[i][0], unsigned(100 + (i & 7)));
EXPECT_EQ(out.u[i][1], unsigned(100 + ((i >> 3) & 7)));
EXPECT_EQ(out.u[i][2], unsigned(100 + ((i >> 6) & 7)));
EXPECT_EQ(out.u[i][3], unsigned(100 + ((i >> 9) & 7)));
}
}
TEST(ReactorUnitTests, Branching)
{
FunctionT<int()> function;
{
Int x = 0;
For(Int i = 0, i < 8, i++)
{
If(i < 2)
{
x += 1;
}
Else If(i < 4)
{
x += 10;
}
Else If(i < 6)
{
x += 100;
}
Else
{
x += 1000;
}
For(Int i = 0, i < 5, i++)
x += 10000;
}
For(Int i = 0, i < 10, i++) for(int i = 0; i < 10; i++)
For(Int i = 0, i < 10, i++)
{
x += 1000000;
}
For(Int i = 0, i < 2, i++)
If(x == 1000402222)
{
If(x != 1000402222)
x += 1000000000;
}
Else
x = -5;
Return(x);
}
auto routine = function("one");
int result = routine();
EXPECT_EQ(result, 1000402222);
}
TEST(ReactorUnitTests, MinMax)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Float4>(out + 16 * 0) = Min(Float4(1.0f, 0.0f, -0.0f, +0.0f), Float4(0.0f, 1.0f, +0.0f, -0.0f));
*Pointer<Float4>(out + 16 * 1) = Max(Float4(1.0f, 0.0f, -0.0f, +0.0f), Float4(0.0f, 1.0f, +0.0f, -0.0f));
*Pointer<Int4>(out + 16 * 2) = Min(Int4(1, 0, -1, -0), Int4(0, 1, 0, +0));
*Pointer<Int4>(out + 16 * 3) = Max(Int4(1, 0, -1, -0), Int4(0, 1, 0, +0));
*Pointer<UInt4>(out + 16 * 4) = Min(UInt4(1, 0, -1, -0), UInt4(0, 1, 0, +0));
*Pointer<UInt4>(out + 16 * 5) = Max(UInt4(1, 0, -1, -0), UInt4(0, 1, 0, +0));
*Pointer<Short4>(out + 16 * 6) = Min(Short4(1, 0, -1, -0), Short4(0, 1, 0, +0));
*Pointer<Short4>(out + 16 * 7) = Max(Short4(1, 0, -1, -0), Short4(0, 1, 0, +0));
*Pointer<UShort4>(out + 16 * 8) = Min(UShort4(1, 0, -1, -0), UShort4(0, 1, 0, +0));
*Pointer<UShort4>(out + 16 * 9) = Max(UShort4(1, 0, -1, -0), UShort4(0, 1, 0, +0));
Return(0);
}
auto routine = function("one");
unsigned int out[10][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x00000000u);
EXPECT_EQ(out[0][1], 0x00000000u);
EXPECT_EQ(out[0][2], 0x00000000u);
EXPECT_EQ(out[0][3], 0x80000000u);
EXPECT_EQ(out[1][0], 0x3F800000u);
EXPECT_EQ(out[1][1], 0x3F800000u);
EXPECT_EQ(out[1][2], 0x00000000u);
EXPECT_EQ(out[1][3], 0x80000000u);
EXPECT_EQ(out[2][0], 0x00000000u);
EXPECT_EQ(out[2][1], 0x00000000u);
EXPECT_EQ(out[2][2], 0xFFFFFFFFu);
EXPECT_EQ(out[2][3], 0x00000000u);
EXPECT_EQ(out[3][0], 0x00000001u);
EXPECT_EQ(out[3][1], 0x00000001u);
EXPECT_EQ(out[3][2], 0x00000000u);
EXPECT_EQ(out[3][3], 0x00000000u);
EXPECT_EQ(out[4][0], 0x00000000u);
EXPECT_EQ(out[4][1], 0x00000000u);
EXPECT_EQ(out[4][2], 0x00000000u);
EXPECT_EQ(out[4][3], 0x00000000u);
EXPECT_EQ(out[5][0], 0x00000001u);
EXPECT_EQ(out[5][1], 0x00000001u);
EXPECT_EQ(out[5][2], 0xFFFFFFFFu);
EXPECT_EQ(out[5][3], 0x00000000u);
EXPECT_EQ(out[6][0], 0x00000000u);
EXPECT_EQ(out[6][1], 0x0000FFFFu);
EXPECT_EQ(out[6][2], 0x00000000u);
EXPECT_EQ(out[6][3], 0x00000000u);
EXPECT_EQ(out[7][0], 0x00010001u);
EXPECT_EQ(out[7][1], 0x00000000u);
EXPECT_EQ(out[7][2], 0x00000000u);
EXPECT_EQ(out[7][3], 0x00000000u);
EXPECT_EQ(out[8][0], 0x00000000u);
EXPECT_EQ(out[8][1], 0x00000000u);
EXPECT_EQ(out[8][2], 0x00000000u);
EXPECT_EQ(out[8][3], 0x00000000u);
EXPECT_EQ(out[9][0], 0x00010001u);
EXPECT_EQ(out[9][1], 0x0000FFFFu);
EXPECT_EQ(out[9][2], 0x00000000u);
EXPECT_EQ(out[9][3], 0x00000000u);
}
TEST(ReactorUnitTests, NotNeg)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Int>(out + 16 * 0) = ~Int(0x55555555);
*Pointer<Short>(out + 16 * 1) = ~Short(0x5555);
*Pointer<Int4>(out + 16 * 2) = ~Int4(0x55555555, 0xAAAAAAAA, 0x00000000, 0xFFFFFFFF);
*Pointer<Short4>(out + 16 * 3) = ~Short4(0x5555, 0xAAAA, 0x0000, 0xFFFF);
*Pointer<Int>(out + 16 * 4) = -Int(0x55555555);
*Pointer<Short>(out + 16 * 5) = -Short(0x5555);
*Pointer<Int4>(out + 16 * 6) = -Int4(0x55555555, 0xAAAAAAAA, 0x00000000, 0xFFFFFFFF);
*Pointer<Short4>(out + 16 * 7) = -Short4(0x5555, 0xAAAA, 0x0000, 0xFFFF);
*Pointer<Float4>(out + 16 * 8) = -Float4(1.0f, -1.0f, 0.0f, -0.0f);
Return(0);
}
auto routine = function("one");
unsigned int out[10][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0xAAAAAAAAu);
EXPECT_EQ(out[0][1], 0x00000000u);
EXPECT_EQ(out[0][2], 0x00000000u);
EXPECT_EQ(out[0][3], 0x00000000u);
EXPECT_EQ(out[1][0], 0x0000AAAAu);
EXPECT_EQ(out[1][1], 0x00000000u);
EXPECT_EQ(out[1][2], 0x00000000u);
EXPECT_EQ(out[1][3], 0x00000000u);
EXPECT_EQ(out[2][0], 0xAAAAAAAAu);
EXPECT_EQ(out[2][1], 0x55555555u);
EXPECT_EQ(out[2][2], 0xFFFFFFFFu);
EXPECT_EQ(out[2][3], 0x00000000u);
EXPECT_EQ(out[3][0], 0x5555AAAAu);
EXPECT_EQ(out[3][1], 0x0000FFFFu);
EXPECT_EQ(out[3][2], 0x00000000u);
EXPECT_EQ(out[3][3], 0x00000000u);
EXPECT_EQ(out[4][0], 0xAAAAAAABu);
EXPECT_EQ(out[4][1], 0x00000000u);
EXPECT_EQ(out[4][2], 0x00000000u);
EXPECT_EQ(out[4][3], 0x00000000u);
EXPECT_EQ(out[5][0], 0x0000AAABu);
EXPECT_EQ(out[5][1], 0x00000000u);
EXPECT_EQ(out[5][2], 0x00000000u);
EXPECT_EQ(out[5][3], 0x00000000u);
EXPECT_EQ(out[6][0], 0xAAAAAAABu);
EXPECT_EQ(out[6][1], 0x55555556u);
EXPECT_EQ(out[6][2], 0x00000000u);
EXPECT_EQ(out[6][3], 0x00000001u);
EXPECT_EQ(out[7][0], 0x5556AAABu);
EXPECT_EQ(out[7][1], 0x00010000u);
EXPECT_EQ(out[7][2], 0x00000000u);
EXPECT_EQ(out[7][3], 0x00000000u);
EXPECT_EQ(out[8][0], 0xBF800000u);
EXPECT_EQ(out[8][1], 0x3F800000u);
EXPECT_EQ(out[8][2], 0x80000000u);
EXPECT_EQ(out[8][3], 0x00000000u);
}
TEST(ReactorUnitTests, FPtoUI)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<UInt>(out + 0) = UInt(Float(0xF0000000u));
*Pointer<UInt>(out + 4) = UInt(Float(0xC0000000u));
*Pointer<UInt>(out + 8) = UInt(Float(0x00000001u));
*Pointer<UInt>(out + 12) = UInt(Float(0xF000F000u));
*Pointer<UInt4>(out + 16) = UInt4(Float4(0xF0000000u, 0x80000000u, 0x00000000u, 0xCCCC0000u));
Return(0);
}
auto routine = function("one");
unsigned int out[2][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0xF0000000u);
EXPECT_EQ(out[0][1], 0xC0000000u);
EXPECT_EQ(out[0][2], 0x00000001u);
EXPECT_EQ(out[0][3], 0xF000F000u);
EXPECT_EQ(out[1][0], 0xF0000000u);
EXPECT_EQ(out[1][1], 0x80000000u);
EXPECT_EQ(out[1][2], 0x00000000u);
EXPECT_EQ(out[1][3], 0xCCCC0000u);
}
TEST(ReactorUnitTests, VectorCompare)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Int4>(out + 16 * 0) = CmpEQ(Float4(1.0f, 1.0f, -0.0f, +0.0f), Float4(0.0f, 1.0f, +0.0f, -0.0f));
*Pointer<Int4>(out + 16 * 1) = CmpEQ(Int4(1, 0, -1, -0), Int4(0, 1, 0, +0));
*Pointer<Byte8>(out + 16 * 2) = CmpEQ(SByte8(1, 2, 3, 4, 5, 6, 7, 8), SByte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<Int4>(out + 16 * 3) = CmpNLT(Float4(1.0f, 1.0f, -0.0f, +0.0f), Float4(0.0f, 1.0f, +0.0f, -0.0f));
*Pointer<Int4>(out + 16 * 4) = CmpNLT(Int4(1, 0, -1, -0), Int4(0, 1, 0, +0));
*Pointer<Byte8>(out + 16 * 5) = CmpGT(SByte8(1, 2, 3, 4, 5, 6, 7, 8), SByte8(7, 6, 5, 4, 3, 2, 1, 0));
Return(0);
}
auto routine = function("one");
unsigned int out[6][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x00000000u);
EXPECT_EQ(out[0][1], 0xFFFFFFFFu);
EXPECT_EQ(out[0][2], 0xFFFFFFFFu);
EXPECT_EQ(out[0][3], 0xFFFFFFFFu);
EXPECT_EQ(out[1][0], 0x00000000u);
EXPECT_EQ(out[1][1], 0x00000000u);
EXPECT_EQ(out[1][2], 0x00000000u);
EXPECT_EQ(out[1][3], 0xFFFFFFFFu);
EXPECT_EQ(out[2][0], 0xFF000000u);
EXPECT_EQ(out[2][1], 0x00000000u);
EXPECT_EQ(out[3][0], 0xFFFFFFFFu);
EXPECT_EQ(out[3][1], 0xFFFFFFFFu);
EXPECT_EQ(out[3][2], 0xFFFFFFFFu);
EXPECT_EQ(out[3][3], 0xFFFFFFFFu);
EXPECT_EQ(out[4][0], 0xFFFFFFFFu);
EXPECT_EQ(out[4][1], 0x00000000u);
EXPECT_EQ(out[4][2], 0x00000000u);
EXPECT_EQ(out[4][3], 0xFFFFFFFFu);
EXPECT_EQ(out[5][0], 0x00000000u);
EXPECT_EQ(out[5][1], 0xFFFFFFFFu);
}
TEST(ReactorUnitTests, SaturatedAddAndSubtract)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Byte8>(out + 8 * 0) =
AddSat(Byte8(1, 2, 3, 4, 5, 6, 7, 8),
Byte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<Byte8>(out + 8 * 1) =
AddSat(Byte8(0xFE, 0xFE, 0xFE, 0xFE, 0xFE, 0xFE, 0xFE, 0xFE),
Byte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<Byte8>(out + 8 * 2) =
SubSat(Byte8(1, 2, 3, 4, 5, 6, 7, 8),
Byte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<SByte8>(out + 8 * 3) =
AddSat(SByte8(1, 2, 3, 4, 5, 6, 7, 8),
SByte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<SByte8>(out + 8 * 4) =
AddSat(SByte8(0x7E, 0x7E, 0x7E, 0x7E, 0x7E, 0x7E, 0x7E, 0x7E),
SByte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<SByte8>(out + 8 * 5) =
AddSat(SByte8(0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88),
SByte8(-7, -6, -5, -4, -3, -2, -1, -0));
*Pointer<SByte8>(out + 8 * 6) =
SubSat(SByte8(0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88),
SByte8(7, 6, 5, 4, 3, 2, 1, 0));
*Pointer<Short4>(out + 8 * 7) =
AddSat(Short4(1, 2, 3, 4), Short4(3, 2, 1, 0));
*Pointer<Short4>(out + 8 * 8) =
AddSat(Short4(0x7FFE, 0x7FFE, 0x7FFE, 0x7FFE),
Short4(3, 2, 1, 0));
*Pointer<Short4>(out + 8 * 9) =
AddSat(Short4(0x8001, 0x8002, 0x8003, 0x8004),
Short4(-3, -2, -1, -0));
*Pointer<Short4>(out + 8 * 10) =
SubSat(Short4(0x8001, 0x8002, 0x8003, 0x8004),
Short4(3, 2, 1, 0));
*Pointer<UShort4>(out + 8 * 11) =
AddSat(UShort4(1, 2, 3, 4), UShort4(3, 2, 1, 0));
*Pointer<UShort4>(out + 8 * 12) =
AddSat(UShort4(0xFFFE, 0xFFFE, 0xFFFE, 0xFFFE),
UShort4(3, 2, 1, 0));
*Pointer<UShort4>(out + 8 * 13) =
SubSat(UShort4(1, 2, 3, 4), UShort4(3, 2, 1, 0));
Return(0);
}
auto routine = function("one");
unsigned int out[14][2];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x08080808u);
EXPECT_EQ(out[0][1], 0x08080808u);
EXPECT_EQ(out[1][0], 0xFFFFFFFFu);
EXPECT_EQ(out[1][1], 0xFEFFFFFFu);
EXPECT_EQ(out[2][0], 0x00000000u);
EXPECT_EQ(out[2][1], 0x08060402u);
EXPECT_EQ(out[3][0], 0x08080808u);
EXPECT_EQ(out[3][1], 0x08080808u);
EXPECT_EQ(out[4][0], 0x7F7F7F7Fu);
EXPECT_EQ(out[4][1], 0x7E7F7F7Fu);
EXPECT_EQ(out[5][0], 0x80808080u);
EXPECT_EQ(out[5][1], 0x88868482u);
EXPECT_EQ(out[6][0], 0x80808080u);
EXPECT_EQ(out[6][1], 0x88868482u);
EXPECT_EQ(out[7][0], 0x00040004u);
EXPECT_EQ(out[7][1], 0x00040004u);
EXPECT_EQ(out[8][0], 0x7FFF7FFFu);
EXPECT_EQ(out[8][1], 0x7FFE7FFFu);
EXPECT_EQ(out[9][0], 0x80008000u);
EXPECT_EQ(out[9][1], 0x80048002u);
EXPECT_EQ(out[10][0], 0x80008000u);
EXPECT_EQ(out[10][1], 0x80048002u);
EXPECT_EQ(out[11][0], 0x00040004u);
EXPECT_EQ(out[11][1], 0x00040004u);
EXPECT_EQ(out[12][0], 0xFFFFFFFFu);
EXPECT_EQ(out[12][1], 0xFFFEFFFFu);
EXPECT_EQ(out[13][0], 0x00000000u);
EXPECT_EQ(out[13][1], 0x00040002u);
}
TEST(ReactorUnitTests, Unpack)
{
FunctionT<int(void *, void *)> function;
{
Pointer<Byte> in = function.Arg<0>();
Pointer<Byte> out = function.Arg<1>();
Byte4 test_byte_a = *Pointer<Byte4>(in + 4 * 0);
Byte4 test_byte_b = *Pointer<Byte4>(in + 4 * 1);
*Pointer<Short4>(out + 8 * 0) =
Unpack(test_byte_a, test_byte_b);
*Pointer<Short4>(out + 8 * 1) = Unpack(test_byte_a);
Return(0);
}
auto routine = function("one");
unsigned int in[1][2];
unsigned int out[2][2];
memset(&out, 0, sizeof(out));
in[0][0] = 0xABCDEF12u;
in[0][1] = 0x34567890u;
routine(&in, &out);
EXPECT_EQ(out[0][0], 0x78EF9012u);
EXPECT_EQ(out[0][1], 0x34AB56CDu);
EXPECT_EQ(out[1][0], 0xEFEF1212u);
EXPECT_EQ(out[1][1], 0xABABCDCDu);
}
TEST(ReactorUnitTests, Pack)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<SByte8>(out + 8 * 0) =
PackSigned(Short4(-1, -2, 1, 2),
Short4(3, 4, -3, -4));
*Pointer<Byte8>(out + 8 * 1) =
PackUnsigned(Short4(-1, -2, 1, 2),
Short4(3, 4, -3, -4));
*Pointer<Short8>(out + 8 * 2) =
PackSigned(Int4(-1, -2, 1, 2),
Int4(3, 4, -3, -4));
*Pointer<UShort8>(out + 8 * 4) =
PackUnsigned(Int4(-1, -2, 1, 2),
Int4(3, 4, -3, -4));
Return(0);
}
auto routine = function("one");
unsigned int out[6][2];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x0201FEFFu);
EXPECT_EQ(out[0][1], 0xFCFD0403u);
EXPECT_EQ(out[1][0], 0x02010000u);
EXPECT_EQ(out[1][1], 0x00000403u);
EXPECT_EQ(out[2][0], 0xFFFEFFFFu);
EXPECT_EQ(out[2][1], 0x00020001u);
EXPECT_EQ(out[3][0], 0x00040003u);
EXPECT_EQ(out[3][1], 0xFFFCFFFDu);
EXPECT_EQ(out[4][0], 0x00000000u);
EXPECT_EQ(out[4][1], 0x00020001u);
EXPECT_EQ(out[5][0], 0x00040003u);
EXPECT_EQ(out[5][1], 0x00000000u);
}
TEST(ReactorUnitTests, MulHigh)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Short4>(out + 16 * 0) =
MulHigh(Short4(0x01AA, 0x02DD, 0x03EE, 0xF422),
Short4(0x01BB, 0x02CC, 0x03FF, 0xF411));
*Pointer<UShort4>(out + 16 * 1) =
MulHigh(UShort4(0x01AA, 0x02DD, 0x03EE, 0xF422),
UShort4(0x01BB, 0x02CC, 0x03FF, 0xF411));
*Pointer<Int4>(out + 16 * 2) =
MulHigh(Int4(0x000001AA, 0x000002DD, 0xC8000000, 0xF8000000),
Int4(0x000001BB, 0x84000000, 0x000003EE, 0xD7000000));
*Pointer<UInt4>(out + 16 * 3) =
MulHigh(UInt4(0x000001AAu, 0x000002DDu, 0xC8000000u, 0xD8000000u),
UInt4(0x000001BBu, 0x84000000u, 0x000003EEu, 0xD7000000u));
*Pointer<Int4>(out + 16 * 4) =
MulHigh(Int4(0x7FFFFFFF, 0x7FFFFFFF, 0x80008000, 0xFFFFFFFF),
Int4(0x7FFFFFFF, 0x80000000, 0x80008000, 0xFFFFFFFF));
*Pointer<UInt4>(out + 16 * 5) =
MulHigh(UInt4(0x7FFFFFFFu, 0x7FFFFFFFu, 0x80008000u, 0xFFFFFFFFu),
UInt4(0x7FFFFFFFu, 0x80000000u, 0x80008000u, 0xFFFFFFFFu));
// (U)Short8 variants currently unimplemented.
Return(0);
}
auto routine = function("one");
unsigned int out[6][4];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x00080002u);
EXPECT_EQ(out[0][1], 0x008D000Fu);
EXPECT_EQ(out[1][0], 0x00080002u);
EXPECT_EQ(out[1][1], 0xE8C0000Fu);
EXPECT_EQ(out[2][0], 0x00000000u);
EXPECT_EQ(out[2][1], 0xFFFFFE9Cu);
EXPECT_EQ(out[2][2], 0xFFFFFF23u);
EXPECT_EQ(out[2][3], 0x01480000u);
EXPECT_EQ(out[3][0], 0x00000000u);
EXPECT_EQ(out[3][1], 0x00000179u);
EXPECT_EQ(out[3][2], 0x00000311u);
EXPECT_EQ(out[3][3], 0xB5680000u);
EXPECT_EQ(out[4][0], 0x3FFFFFFFu);
EXPECT_EQ(out[4][1], 0xC0000000u);
EXPECT_EQ(out[4][2], 0x3FFF8000u);
EXPECT_EQ(out[4][3], 0x00000000u);
EXPECT_EQ(out[5][0], 0x3FFFFFFFu);
EXPECT_EQ(out[5][1], 0x3FFFFFFFu);
EXPECT_EQ(out[5][2], 0x40008000u);
EXPECT_EQ(out[5][3], 0xFFFFFFFEu);
}
TEST(ReactorUnitTests, MulAdd)
{
FunctionT<int(void *)> function;
{
Pointer<Byte> out = function.Arg<0>();
*Pointer<Int2>(out + 8 * 0) =
MulAdd(Short4(0x1aa, 0x2dd, 0x3ee, 0xF422),
Short4(0x1bb, 0x2cc, 0x3ff, 0xF411));
// (U)Short8 variant is mentioned but unimplemented
Return(0);
}
auto routine = function("one");
unsigned int out[1][2];
memset(&out, 0, sizeof(out));
routine(&out);
EXPECT_EQ(out[0][0], 0x000AE34Au);
EXPECT_EQ(out[0][1], 0x009D5254u);
}
TEST(ReactorUnitTests, PointersEqual)
{
FunctionT<int(void *, void *)> function;
{
Pointer<Byte> ptrA = function.Arg<0>();
Pointer<Byte> ptrB = function.Arg<1>();
If(ptrA == ptrB)
{
Return(1);
}
Else
{
Return(0);
}
}
auto routine = function("one");
int *a = reinterpret_cast<int *>(uintptr_t(0x0000000000000000));
int *b = reinterpret_cast<int *>(uintptr_t(0x00000000F0000000));
int *c = reinterpret_cast<int *>(uintptr_t(0xF000000000000000));
EXPECT_EQ(routine(&a, &a), 1);
EXPECT_EQ(routine(&b, &b), 1);
EXPECT_EQ(routine(&c, &c), 1);
EXPECT_EQ(routine(&a, &b), 0);
EXPECT_EQ(routine(&b, &a), 0);
EXPECT_EQ(routine(&b, &c), 0);
EXPECT_EQ(routine(&c, &b), 0);
EXPECT_EQ(routine(&c, &a), 0);
EXPECT_EQ(routine(&a, &c), 0);
}
TEST(ReactorUnitTests, Args_2Mixed)
{
// 2 mixed type args
FunctionT<float(int, float)> function;
{
Int a = function.Arg<0>();
Float b = function.Arg<1>();
Return(Float(a) + b);
}
if(auto routine = function("one"))
{
float result = routine(1, 2.f);
EXPECT_EQ(result, 3.f);
}
}
TEST(ReactorUnitTests, Args_4Mixed)
{
// 4 mixed type args (max register allocation on Windows)
FunctionT<float(int, float, int, float)> function;
{
Int a = function.Arg<0>();
Float b = function.Arg<1>();
Int c = function.Arg<2>();
Float d = function.Arg<3>();
Return(Float(a) + b + Float(c) + d);
}
if(auto routine = function("one"))
{
float result = routine(1, 2.f, 3, 4.f);
EXPECT_EQ(result, 10.f);
}
}
TEST(ReactorUnitTests, Args_5Mixed)
{
// 5 mixed type args (5th spills over to stack on Windows)
FunctionT<float(int, float, int, float, int)> function;
{
Int a = function.Arg<0>();
Float b = function.Arg<1>();
Int c = function.Arg<2>();
Float d = function.Arg<3>();
Int e = function.Arg<4>();
Return(Float(a) + b + Float(c) + d + Float(e));
}
if(auto routine = function("one"))
{
float result = routine(1, 2.f, 3, 4.f, 5);
EXPECT_EQ(result, 15.f);
}
}
TEST(ReactorUnitTests, Args_GreaterThan5Mixed)
{
// >5 mixed type args
FunctionT<float(int, float, int, float, int, float, int, float, int, float)> function;
{
Int a = function.Arg<0>();
Float b = function.Arg<1>();
Int c = function.Arg<2>();
Float d = function.Arg<3>();
Int e = function.Arg<4>();
Float f = function.Arg<5>();
Int g = function.Arg<6>();
Float h = function.Arg<7>();
Int i = function.Arg<8>();
Float j = function.Arg<9>();
Return(Float(a) + b + Float(c) + d + Float(e) + f + Float(g) + h + Float(i) + j);
}
if(auto routine = function("one"))
{
float result = routine(1, 2.f, 3, 4.f, 5, 6.f, 7, 8.f, 9, 10.f);
EXPECT_EQ(result, 55.f);
}
}
// This test was written because on Windows with Subzero, we would get a crash when executing a function
// with a large number of local variables. The problem was that on Windows, 4K pages are allocated as
// needed for the stack whenever an access is made in a "guard page", at which point the page is committed,
// and the next 4K page becomes the guard page. If a stack access is made that's beyond the guard page,
// a regular page fault occurs. To fix this, Subzero (and any compiler) now emits a call to __chkstk with
// the stack size in EAX, so that it can probe the stack in 4K increments up to that size, committing the
// required pages. See https://docs.microsoft.com/en-us/windows/win32/devnotes/-win32-chkstk.
TEST(ReactorUnitTests, LargeStack)
{
#if defined(_WIN32)
// An empirically large enough value to access outside the guard pages
constexpr int ArrayByteSize = 24 * 1024;
constexpr int ArraySize = ArrayByteSize / sizeof(int32_t);
FunctionT<void(int32_t * v)> function;
{
// Allocate a stack array large enough that writing to the first element will reach beyond
// the guard page.
Array<Int, ArraySize> largeStackArray;
for(int i = 0; i < ArraySize; ++i)
{
largeStackArray[i] = i;
}
Pointer<Int> in = function.Arg<0>();
for(int i = 0; i < ArraySize; ++i)
{
in[i] = largeStackArray[i];
}
}
auto routine = function("one");
std::array<int32_t, ArraySize> v;
// Run this in a thread, so that we get the default reserved stack size (8K on Win64).
std::thread t([&] {
routine(v.data());
});
t.join();
for(int i = 0; i < ArraySize; ++i)
{
EXPECT_EQ(v[i], i);
}
#endif
}
TEST(ReactorUnitTests, Call)
{
struct Class
{
static int Callback(Class *p, int i, float f)
{
p->i = i;
p->f = f;
return i + int(f);
}
int i = 0;
float f = 0.0f;
};
FunctionT<int(void *)> function;
{
Pointer<Byte> c = function.Arg<0>();
auto res = Call(Class::Callback, c, 10, 20.0f);
Return(res);
}
auto routine = function("one");
Class c;
int res = routine(&c);
EXPECT_EQ(res, 30);
EXPECT_EQ(c.i, 10);
EXPECT_EQ(c.f, 20.0f);
}
TEST(ReactorUnitTests, CallMemberFunction)
{
struct Class
{
int Callback(int argI, float argF)
{
i = argI;
f = argF;
return i + int(f);
}
int i = 0;
float f = 0.0f;
};
Class c;
FunctionT<int()> function;
{
auto res = Call(&Class::Callback, &c, 10, 20.0f);
Return(res);
}
auto routine = function("one");
int res = routine();
EXPECT_EQ(res, 30);
EXPECT_EQ(c.i, 10);
EXPECT_EQ(c.f, 20.0f);
}
TEST(ReactorUnitTests, CallMemberFunctionIndirect)
{
struct Class
{
int Callback(int argI, float argF)
{
i = argI;
f = argF;
return i + int(f);
}
int i = 0;
float f = 0.0f;
};
FunctionT<int(void *)> function;
{
Pointer<Byte> c = function.Arg<0>();
auto res = Call(&Class::Callback, c, 10, 20.0f);
Return(res);
}
auto routine = function("one");
Class c;
int res = routine(&c);
EXPECT_EQ(res, 30);
EXPECT_EQ(c.i, 10);
EXPECT_EQ(c.f, 20.0f);
}
TEST(ReactorUnitTests, CallImplicitCast)
{
struct Class
{
static void Callback(Class *c, const char *s)
{
c->str = s;
}
std::string str;
};
FunctionT<void(Class * c, const char *s)> function;
{
Pointer<Byte> c = function.Arg<0>();
Pointer<Byte> s = function.Arg<1>();
Call(Class::Callback, c, s);
}
auto routine = function("one");
Class c;
routine(&c, "hello world");
EXPECT_EQ(c.str, "hello world");
}
TEST(ReactorUnitTests, CallBoolReturnFunction)
{
struct Class
{
static bool IsEven(int a)
{
return a % 2 == 0;
}
};
FunctionT<int(int)> function;
{
Int a = function.Arg<0>();
Bool res = Call(Class::IsEven, a);
If(res)
{
Return(1);
}
Return(0);
}
auto routine = function("one");
for(int i = 0; i < 10; ++i)
{
EXPECT_EQ(routine(i), i % 2 == 0);
}
}
TEST(ReactorUnitTests, Call_Args4)
{
struct Class
{
static int Func(int a, int b, int c, int d)
{
return a + b + c + d;
}
};
{
FunctionT<int()> function;
{
auto res = Call(Class::Func, 1, 2, 3, 4);
Return(res);
}
auto routine = function("one");
int res = routine();
EXPECT_EQ(res, 1 + 2 + 3 + 4);
}
}
TEST(ReactorUnitTests, Call_Args5)
{
struct Class
{
static int Func(int a, int b, int c, int d, int e)
{
return a + b + c + d + e;
}
};
{
FunctionT<int()> function;
{
auto res = Call(Class::Func, 1, 2, 3, 4, 5);
Return(res);
}
auto routine = function("one");
int res = routine();
EXPECT_EQ(res, 1 + 2 + 3 + 4 + 5);
}
}
TEST(ReactorUnitTests, Call_ArgsMany)
{
struct Class
{
static int Func(int a, int b, int c, int d, int e, int f, int g, int h)
{
return a + b + c + d + e + f + g + h;
}
};
{
FunctionT<int()> function;
{
auto res = Call(Class::Func, 1, 2, 3, 4, 5, 6, 7, 8);
Return(res);
}
auto routine = function("one");
int res = routine();
EXPECT_EQ(res, 1 + 2 + 3 + 4 + 5 + 6 + 7 + 8);
}
}
TEST(ReactorUnitTests, Call_ArgsMixed)
{
struct Class
{
static int Func(int a, float b, int *c, float *d, int e, float f, int *g, float *h)
{
return a + b + *c + *d + e + f + *g + *h;
}
};
{
FunctionT<int()> function;
{
Int c(3);
Float d(4);
Int g(7);
Float h(8);
auto res = Call(Class::Func, 1, 2.f, &c, &d, 5, 6.f, &g, &h);
Return(res);
}
auto routine = function("one");
int res = routine();
EXPECT_EQ(res, 1 + 2 + 3 + 4 + 5 + 6 + 7 + 8);
}
}
TEST(ReactorUnitTests, Call_ArgsPointer)
{
struct Class
{
static int Func(int *a)
{
return *a;
}
};
{
FunctionT<int()> function;
{
Int a(12345);
auto res = Call(Class::Func, &a);
Return(res);
}
auto routine = function("one");
int res = routine();
EXPECT_EQ(res, 12345);
}
}
TEST(ReactorUnitTests, CallExternalCallRoutine)
{
// routine1 calls Class::Func, passing it a pointer to routine2, and Class::Func calls routine2
auto routine2 = [] {
FunctionT<float(float, int)> function;
{
Float a = function.Arg<0>();
Int b = function.Arg<1>();
Return(a + Float(b));
}
return function("two");
}();
struct Class
{
static float Func(void *p, float a, int b)
{
auto funcToCall = reinterpret_cast<float (*)(float, int)>(p);
return funcToCall(a, b);
}
};
auto routine1 = [] {
FunctionT<float(void *, float, int)> function;
{
Pointer<Byte> funcToCall = function.Arg<0>();
Float a = function.Arg<1>();
Int b = function.Arg<2>();
Float result = Call(Class::Func, funcToCall, a, b);
Return(result);
}
return function("one");
}();
float result = routine1((void *)routine2.getEntry(), 12.f, 13);
EXPECT_EQ(result, 25.f);
}
// Check that a complex generated function which utilizes all 8 or 16 XMM
// registers computes the correct result.
// (Note that due to MSC's lack of support for inline assembly in x64,
// this test does not actually check that the register contents are
// preserved, just that the generated function computes the correct value.
// It's necessary to inspect the registers in a debugger to actually verify.)
TEST(ReactorUnitTests, PreserveXMMRegisters)
{
FunctionT<void(void *, void *)> function;
{
Pointer<Byte> in = function.Arg<0>();
Pointer<Byte> out = function.Arg<1>();
Float4 a = *Pointer<Float4>(in + 16 * 0);
Float4 b = *Pointer<Float4>(in + 16 * 1);
Float4 c = *Pointer<Float4>(in + 16 * 2);
Float4 d = *Pointer<Float4>(in + 16 * 3);
Float4 e = *Pointer<Float4>(in + 16 * 4);
Float4 f = *Pointer<Float4>(in + 16 * 5);
Float4 g = *Pointer<Float4>(in + 16 * 6);
Float4 h = *Pointer<Float4>(in + 16 * 7);
Float4 i = *Pointer<Float4>(in + 16 * 8);
Float4 j = *Pointer<Float4>(in + 16 * 9);
Float4 k = *Pointer<Float4>(in + 16 * 10);
Float4 l = *Pointer<Float4>(in + 16 * 11);
Float4 m = *Pointer<Float4>(in + 16 * 12);
Float4 n = *Pointer<Float4>(in + 16 * 13);
Float4 o = *Pointer<Float4>(in + 16 * 14);
Float4 p = *Pointer<Float4>(in + 16 * 15);
Float4 ab = a + b;
Float4 cd = c + d;
Float4 ef = e + f;
Float4 gh = g + h;
Float4 ij = i + j;
Float4 kl = k + l;
Float4 mn = m + n;
Float4 op = o + p;
Float4 abcd = ab + cd;
Float4 efgh = ef + gh;
Float4 ijkl = ij + kl;
Float4 mnop = mn + op;
Float4 abcdefgh = abcd + efgh;
Float4 ijklmnop = ijkl + mnop;
Float4 sum = abcdefgh + ijklmnop;
*Pointer<Float4>(out) = sum;
Return();
}
auto routine = function("one");
assert(routine);
float input[64] = { 1.0f, 0.0f, 0.0f, 0.0f,
-1.0f, 1.0f, -1.0f, 0.0f,
1.0f, 2.0f, -2.0f, 0.0f,
-1.0f, 3.0f, -3.0f, 0.0f,
1.0f, 4.0f, -4.0f, 0.0f,
-1.0f, 5.0f, -5.0f, 0.0f,
1.0f, 6.0f, -6.0f, 0.0f,
-1.0f, 7.0f, -7.0f, 0.0f,
1.0f, 8.0f, -8.0f, 0.0f,
-1.0f, 9.0f, -9.0f, 0.0f,
1.0f, 10.0f, -10.0f, 0.0f,
-1.0f, 11.0f, -11.0f, 0.0f,
1.0f, 12.0f, -12.0f, 0.0f,
-1.0f, 13.0f, -13.0f, 0.0f,
1.0f, 14.0f, -14.0f, 0.0f,
-1.0f, 15.0f, -15.0f, 0.0f };
float result[4];
routine(input, result);
EXPECT_EQ(result[0], 0.0f);
EXPECT_EQ(result[1], 120.0f);
EXPECT_EQ(result[2], -120.0f);
EXPECT_EQ(result[3], 0.0f);
}
template<typename T>
class CToReactorTCastTest : public ::testing::Test
{
public:
using CType = typename std::tuple_element<0, T>::type;
using ReactorType = typename std::tuple_element<1, T>::type;
};
using CToReactorTCastTestTypes = ::testing::Types< // Subset of types that can be used as arguments.
// std::pair<bool, Bool>, FIXME(capn): Not supported as argument type by Subzero.
// std::pair<uint8_t, Byte>, FIXME(capn): Not supported as argument type by Subzero.
// std::pair<int8_t, SByte>, FIXME(capn): Not supported as argument type by Subzero.
// std::pair<int16_t, Short>, FIXME(capn): Not supported as argument type by Subzero.
// std::pair<uint16_t, UShort>, FIXME(capn): Not supported as argument type by Subzero.
std::pair<int, Int>,
std::pair<unsigned int, UInt>,
std::pair<float, Float>>;
TYPED_TEST_SUITE(CToReactorTCastTest, CToReactorTCastTestTypes);
TYPED_TEST(CToReactorTCastTest, Casts)
{
using CType = typename TestFixture::CType;
using ReactorType = typename TestFixture::ReactorType;
std::shared_ptr<Routine> routine;
{
Function<Int(ReactorType)> function;
{
ReactorType a = function.template Arg<0>();
ReactorType b = CType{};
RValue<ReactorType> c = RValue<ReactorType>(CType{});
Bool same = (a == b) && (a == c);
Return(IfThenElse(same, Int(1), Int(0))); // TODO: Ability to use Bools as return values.
}
routine = function("one");
auto callable = (int (*)(CType))routine->getEntry();
CType in = {};
EXPECT_EQ(callable(in), 1);
}
}
template<typename T>
class GEPTest : public ::testing::Test
{
public:
using CType = typename std::tuple_element<0, T>::type;
using ReactorType = typename std::tuple_element<1, T>::type;
};
using GEPTestTypes = ::testing::Types<
std::pair<bool, Bool>,
std::pair<int8_t, Byte>,
std::pair<int8_t, SByte>,
std::pair<int8_t[4], Byte4>,
std::pair<int8_t[4], SByte4>,
std::pair<int8_t[8], Byte8>,
std::pair<int8_t[8], SByte8>,
std::pair<int8_t[16], Byte16>,
std::pair<int8_t[16], SByte16>,
std::pair<int16_t, Short>,
std::pair<int16_t, UShort>,
std::pair<int16_t[2], Short2>,
std::pair<int16_t[2], UShort2>,
std::pair<int16_t[4], Short4>,
std::pair<int16_t[4], UShort4>,
std::pair<int16_t[8], Short8>,
std::pair<int16_t[8], UShort8>,
std::pair<int, Int>,
std::pair<int, UInt>,
std::pair<int[2], Int2>,
std::pair<int[2], UInt2>,
std::pair<int[4], Int4>,
std::pair<int[4], UInt4>,
std::pair<int64_t, Long>,
std::pair<int16_t, Half>,
std::pair<float, Float>,
std::pair<float[2], Float2>,
std::pair<float[4], Float4>>;
TYPED_TEST_SUITE(GEPTest, GEPTestTypes);
TYPED_TEST(GEPTest, PtrOffsets)
{
using CType = typename TestFixture::CType;
using ReactorType = typename TestFixture::ReactorType;
std::shared_ptr<Routine> routine;
{
Function<Pointer<ReactorType>(Pointer<ReactorType>, Int)> function;
{
Pointer<ReactorType> pointer = function.template Arg<0>();
Int index = function.template Arg<1>();
Return(&pointer[index]);
}
routine = function("one");
auto callable = (CType * (*)(CType *, unsigned int)) routine->getEntry();
union PtrInt
{
CType *p;
size_t i;
};
PtrInt base;
base.i = 0x10000;
for(int i = 0; i < 5; i++)
{
PtrInt reference;
reference.p = &base.p[i];
PtrInt result;
result.p = callable(base.p, i);
auto expect = reference.i - base.i;
auto got = result.i - base.i;
EXPECT_EQ(got, expect) << "i:" << i;
}
}
}
static const std::vector<int> fibonacci = {
0,
1,
1,
2,
3,
5,
8,
13,
21,
34,
55,
89,
144,
233,
377,
610,
987,
1597,
2584,
4181,
6765,
10946,
17711,
28657,
46368,
75025,
121393,
196418,
317811,
};
TEST(ReactorUnitTests, Fibonacci)
{
FunctionT<int(int)> function;
{
Int n = function.Arg<0>();
Int current = 0;
Int next = 1;
For(Int i = 0, i < n, i++)
{
auto tmp = current + next;
current = next;
next = tmp;
}
Return(current);
}
auto routine = function("one");
for(size_t i = 0; i < fibonacci.size(); i++)
{
EXPECT_EQ(routine(i), fibonacci[i]);
}
}
TEST(ReactorUnitTests, Coroutines_Fibonacci)
{
if(!rr::Caps.CoroutinesSupported)
{
SUCCEED() << "Coroutines not supported";
return;
}
Coroutine<int()> function;
{
Yield(Int(0));
Yield(Int(1));
Int current = 1;
Int next = 1;
While(true)
{
Yield(next);
auto tmp = current + next;
current = next;
next = tmp;
}
}
auto coroutine = function();
for(size_t i = 0; i < fibonacci.size(); i++)
{
int out = 0;
EXPECT_EQ(coroutine->await(out), true);
EXPECT_EQ(out, fibonacci[i]);
}
}
TEST(ReactorUnitTests, Coroutines_Parameters)
{
if(!rr::Caps.CoroutinesSupported)
{
SUCCEED() << "Coroutines not supported";
return;
}
Coroutine<uint8_t(uint8_t * data, int count)> function;
{
Pointer<Byte> data = function.Arg<0>();
Int count = function.Arg<1>();
For(Int i = 0, i < count, i++)
{
Yield(data[i]);
}
}
uint8_t data[] = { 10, 20, 30 };
auto coroutine = function(&data[0], 3);
uint8_t out = 0;
EXPECT_EQ(coroutine->await(out), true);
EXPECT_EQ(out, 10);
out = 0;
EXPECT_EQ(coroutine->await(out), true);
EXPECT_EQ(out, 20);
out = 0;
EXPECT_EQ(coroutine->await(out), true);
EXPECT_EQ(out, 30);
out = 99;
EXPECT_EQ(coroutine->await(out), false);
EXPECT_EQ(out, 99);
EXPECT_EQ(coroutine->await(out), false);
EXPECT_EQ(out, 99);
}
// This test was written because Subzero's handling of vector types
// failed when more than one function is generated, as is the case
// with coroutines.
TEST(ReactorUnitTests, Coroutines_Vectors)
{
if(!rr::Caps.CoroutinesSupported)
{
SUCCEED() << "Coroutines not supported";
return;
}
Coroutine<int()> function;
{
Int4 a{ 1, 2, 3, 4 };
Yield(rr::Extract(a, 2));
Int4 b{ 5, 6, 7, 8 };
Yield(rr::Extract(b, 1));
Int4 c{ 9, 10, 11, 12 };
Yield(rr::Extract(c, 1));
}
auto coroutine = function();
int out;
coroutine->await(out);
EXPECT_EQ(out, 3);
coroutine->await(out);
EXPECT_EQ(out, 6);
coroutine->await(out);
EXPECT_EQ(out, 10);
}
// This test was written to make sure a coroutine without a Yield()
// works correctly, by executing like a regular function with no
// return (the return type is ignored).
// We also run it twice to ensure per instance and/or global state
// is properly cleaned up in between.
TEST(ReactorUnitTests, Coroutines_NoYield)
{
if(!rr::Caps.CoroutinesSupported)
{
SUCCEED() << "Coroutines not supported";
return;
}
for(int i = 0; i < 2; ++i)
{
Coroutine<int()> function;
{
Int a;
a = 4;
}
auto coroutine = function();
int out;
EXPECT_EQ(coroutine->await(out), false);
}
}
// Test generating one coroutine, and executing it on multiple threads. This makes
// sure the implementation manages per-call instance data correctly.
TEST(ReactorUnitTests, Coroutines_Parallel)
{
if(!rr::Caps.CoroutinesSupported)
{
SUCCEED() << "Coroutines not supported";
return;
}
Coroutine<int()> function;
{
Yield(Int(0));
Yield(Int(1));
Int current = 1;
Int next = 1;
While(true)
{
Yield(next);
auto tmp = current + next;
current = next;
next = tmp;
}
}
// Must call on same thread that creates the coroutine
function.finalize();
std::vector<std::thread> threads;
const size_t numThreads = 100;
for(size_t t = 0; t < numThreads; ++t)
{
threads.emplace_back([&] {
auto coroutine = function();
for(size_t i = 0; i < fibonacci.size(); i++)
{
int out = 0;
EXPECT_EQ(coroutine->await(out), true);
EXPECT_EQ(out, fibonacci[i]);
}
});
}
for(auto &t : threads)
{
t.join();
}
}
template<typename TestFuncType, typename RefFuncType, typename TestValueType>
struct IntrinsicTestParams
{
std::function<TestFuncType> testFunc; // Function we're testing (Reactor)
std::function<RefFuncType> refFunc; // Reference function to test against (C)
std::vector<TestValueType> testValues; // Values to input to functions
};
using IntrinsicTestParams_Float = IntrinsicTestParams<RValue<Float>(RValue<Float>), float(float), float>;
using IntrinsicTestParams_Float4 = IntrinsicTestParams<RValue<Float4>(RValue<Float4>), float(float), float>;
using IntrinsicTestParams_Float4_Float4 = IntrinsicTestParams<RValue<Float4>(RValue<Float4>, RValue<Float4>), float(float, float), std::pair<float, float>>;
struct IntrinsicTest_Float : public testing::TestWithParam<IntrinsicTestParams_Float>
{
void test()
{
FunctionT<float(float)> function;
{
Return(GetParam().testFunc((Float(function.Arg<0>()))));
}
auto routine = function("one");
for(auto &&v : GetParam().testValues)
{
SCOPED_TRACE(v);
EXPECT_FLOAT_EQ(routine(v), GetParam().refFunc(v));
}
}
};
using float4 = float[4];
using int4 = int[4];
// TODO: Move to Reactor.hpp
template<>
struct rr::CToReactor<int[4]>
{
using type = Int4;
static Int4 cast(float[4]);
};
// Value type wrapper around a <type>[4] (i.e. float4, int4)
template<typename T>
struct type4_value
{
using E = typename std::remove_pointer_t<std::decay_t<T>>;
type4_value() = default;
explicit type4_value(E rep)
: v{ rep, rep, rep, rep }
{}
type4_value(E x, E y, E z, E w)
: v{ x, y, z, w }
{}
bool operator==(const type4_value &rhs) const
{
return std::equal(std::begin(v), std::end(v), rhs.v);
}
// For gtest printing
friend std::ostream &operator<<(std::ostream &os, const type4_value &value)
{
return os << "[" << value.v[0] << ", " << value.v[1] << ", " << value.v[2] << ", " << value.v[3] << "]";
}
T v;
};
using float4_value = type4_value<float4>;
using int4_value = type4_value<int4>;
// Invoke a void(type4_value<T>*) routine on &v.v, returning wrapped result in v
template<typename RoutineType, typename T>
type4_value<T> invokeRoutine(RoutineType &routine, type4_value<T> v)
{
routine(&v.v);
return v;
}
// Invoke a void(type4_value<T>*, type4_value<T>*) routine on &v1.v, &v2.v returning wrapped result in v1
template<typename RoutineType, typename T>
type4_value<T> invokeRoutine(RoutineType &routine, type4_value<T> v1, type4_value<T> v2)
{
routine(&v1.v, &v2.v);
return v1;
}
struct IntrinsicTest_Float4 : public testing::TestWithParam<IntrinsicTestParams_Float4>
{
void test()
{
FunctionT<void(float4 *)> function;
{
Pointer<Float4> a = function.Arg<0>();
*a = GetParam().testFunc(*a);
Return();
}
auto routine = function("one");
for(auto &&v : GetParam().testValues)
{
SCOPED_TRACE(v);
float4_value result = invokeRoutine(routine, float4_value{ v });
float4_value expected = float4_value{ GetParam().refFunc(v) };
EXPECT_FLOAT_EQ(result.v[0], expected.v[0]);
EXPECT_FLOAT_EQ(result.v[1], expected.v[1]);
EXPECT_FLOAT_EQ(result.v[2], expected.v[2]);
EXPECT_FLOAT_EQ(result.v[3], expected.v[3]);
}
}
};
struct IntrinsicTest_Float4_Float4 : public testing::TestWithParam<IntrinsicTestParams_Float4_Float4>
{
void test()
{
FunctionT<void(float4 *, float4 *)> function;
{
Pointer<Float4> a = function.Arg<0>();
Pointer<Float4> b = function.Arg<1>();
*a = GetParam().testFunc(*a, *b);
Return();
}
auto routine = function("one");
for(auto &&v : GetParam().testValues)
{
SCOPED_TRACE(v);
float4_value result = invokeRoutine(routine, float4_value{ v.first }, float4_value{ v.second });
float4_value expected = float4_value{ GetParam().refFunc(v.first, v.second) };
EXPECT_FLOAT_EQ(result.v[0], expected.v[0]);
EXPECT_FLOAT_EQ(result.v[1], expected.v[1]);
EXPECT_FLOAT_EQ(result.v[2], expected.v[2]);
EXPECT_FLOAT_EQ(result.v[3], expected.v[3]);
}
}
};
// clang-format off
INSTANTIATE_TEST_SUITE_P(IntrinsicTestParams_Float, IntrinsicTest_Float, testing::Values(
IntrinsicTestParams_Float{ [](Float v) { return rr::Exp2(v); }, exp2f, {0.f, 1.f, 12345.f} },
IntrinsicTestParams_Float{ [](Float v) { return rr::Log2(v); }, log2f, {0.f, 1.f, 12345.f} },
IntrinsicTestParams_Float{ [](Float v) { return rr::Sqrt(v); }, sqrtf, {0.f, 1.f, 12345.f} }
));
// clang-format on
// TODO(b/149110874) Use coshf/sinhf when we've implemented SpirV versions at the SpirV level
float vulkan_sinhf(float a)
{
return ((expf(a) - expf(-a)) / 2);
}
float vulkan_coshf(float a)
{
return ((expf(a) + expf(-a)) / 2);
}
// clang-format off
constexpr float PI = 3.141592653589793f;
INSTANTIATE_TEST_SUITE_P(IntrinsicTestParams_Float4, IntrinsicTest_Float4, testing::Values(
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Sin(v); }, sinf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Cos(v); }, cosf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Tan(v); }, tanf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Asin(v); }, asinf, {0.f, 1.f, -1.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Acos(v); }, acosf, {0.f, 1.f, -1.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Atan(v); }, atanf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Sinh(v); }, vulkan_sinhf, {0.f, 1.f, PI, 12345.f, 0x1.65a84ep6} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Cosh(v); }, vulkan_coshf, {0.f, 1.f, PI, 12345.f, 0x1.65a84ep6} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Tanh(v); }, tanhf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Asinh(v); }, asinhf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Acosh(v); }, acoshf, { 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Atanh(v); }, atanhf, {0.f, 1.f, -1.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Exp(v); }, expf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Log(v); }, logf, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Exp2(v); }, exp2f, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Log2(v); }, log2f, {0.f, 1.f, PI, 12345.f} },
IntrinsicTestParams_Float4{ [](RValue<Float4> v) { return rr::Sqrt(v); }, sqrtf, {0.f, 1.f, PI, 12345.f} }
));
// clang-format on
// clang-format off
INSTANTIATE_TEST_SUITE_P(IntrinsicTestParams_Float4_Float4, IntrinsicTest_Float4_Float4, testing::Values(
IntrinsicTestParams_Float4_Float4{ [](RValue<Float4> v1, RValue<Float4> v2) { return Atan2(v1, v2); }, atan2f, { {0.f, 0.f}, {0.f, -1.f}, {-1.f, 0.f}, {12345.f, 12345.f} } },
IntrinsicTestParams_Float4_Float4{ [](RValue<Float4> v1, RValue<Float4> v2) { return Pow(v1, v2); }, powf, { {0.f, 0.f}, {0.f, -1.f}, {-1.f, 0.f}, {12345.f, 12345.f} } }
));
// clang-format on
TEST_P(IntrinsicTest_Float, Test)
{
test();
}
TEST_P(IntrinsicTest_Float4, Test)
{
test();
}
TEST_P(IntrinsicTest_Float4_Float4, Test)
{
test();
}
TEST(ReactorUnitTests, Intrinsics_Ctlz)
{
// ctlz: counts number of leading zeros
{
Function<UInt(UInt x)> function;
{
UInt x = function.Arg<0>();
Return(rr::Ctlz(x, false));
}
auto routine = function("one");
auto callable = (uint32_t(*)(uint32_t))routine->getEntry();
for(uint32_t i = 0; i < 31; ++i)
{
uint32_t result = callable(1 << i);
EXPECT_EQ(result, 31 - i);
}
// Input 0 should return 32 for isZeroUndef == false
{
uint32_t result = callable(0);
EXPECT_EQ(result, 32u);
}
}
{
Function<Void(Pointer<UInt4>, UInt x)> function;
{
Pointer<UInt4> out = function.Arg<0>();
UInt x = function.Arg<1>();
*out = rr::Ctlz(UInt4(x), false);
}
auto routine = function("one");
auto callable = (void (*)(uint32_t *, uint32_t))routine->getEntry();
uint32_t x[4];
for(uint32_t i = 0; i < 31; ++i)
{
callable(x, 1 << i);
EXPECT_EQ(x[0], 31 - i);
EXPECT_EQ(x[1], 31 - i);
EXPECT_EQ(x[2], 31 - i);
EXPECT_EQ(x[3], 31 - i);
}
// Input 0 should return 32 for isZeroUndef == false
{
callable(x, 0);
EXPECT_EQ(x[0], 32u);
EXPECT_EQ(x[1], 32u);
EXPECT_EQ(x[2], 32u);
EXPECT_EQ(x[3], 32u);
}
}
}
TEST(ReactorUnitTests, Intrinsics_Cttz)
{
// cttz: counts number of trailing zeros
{
Function<UInt(UInt x)> function;
{
UInt x = function.Arg<0>();
Return(rr::Cttz(x, false));
}
auto routine = function("one");
auto callable = (uint32_t(*)(uint32_t))routine->getEntry();
for(uint32_t i = 0; i < 31; ++i)
{
uint32_t result = callable(1 << i);
EXPECT_EQ(result, i);
}
// Input 0 should return 32 for isZeroUndef == false
{
uint32_t result = callable(0);
EXPECT_EQ(result, 32u);
}
}
{
Function<Void(Pointer<UInt4>, UInt x)> function;
{
Pointer<UInt4> out = function.Arg<0>();
UInt x = function.Arg<1>();
*out = rr::Cttz(UInt4(x), false);
}
auto routine = function("one");
auto callable = (void (*)(uint32_t *, uint32_t))routine->getEntry();
uint32_t x[4];
for(uint32_t i = 0; i < 31; ++i)
{
callable(x, 1 << i);
EXPECT_EQ(x[0], i);
EXPECT_EQ(x[1], i);
EXPECT_EQ(x[2], i);
EXPECT_EQ(x[3], i);
}
// Input 0 should return 32 for isZeroUndef == false
{
callable(x, 0);
EXPECT_EQ(x[0], 32u);
EXPECT_EQ(x[1], 32u);
EXPECT_EQ(x[2], 32u);
EXPECT_EQ(x[3], 32u);
}
}
}
TEST(ReactorUnitTests, Intrinsics_Scatter)
{
Function<Void(Pointer<Float> base, Pointer<Float4> val, Pointer<Int4> offsets)> function;
{
Pointer<Float> base = function.Arg<0>();
Pointer<Float4> val = function.Arg<1>();
Pointer<Int4> offsets = function.Arg<2>();
auto mask = Int4(~0, ~0, ~0, ~0);
unsigned int alignment = 1;
Scatter(base, *val, *offsets, mask, alignment);
}
float buffer[16] = { 0 };
constexpr auto elemSize = sizeof(buffer[0]);
int offsets[] = {
1 * elemSize,
6 * elemSize,
11 * elemSize,
13 * elemSize
};
float val[4] = { 10, 60, 110, 130 };
auto routine = function("one");
auto entry = (void (*)(float *, float *, int *))routine->getEntry();
entry(buffer, val, offsets);
EXPECT_EQ(buffer[offsets[0] / sizeof(buffer[0])], 10);
EXPECT_EQ(buffer[offsets[1] / sizeof(buffer[0])], 60);
EXPECT_EQ(buffer[offsets[2] / sizeof(buffer[0])], 110);
EXPECT_EQ(buffer[offsets[3] / sizeof(buffer[0])], 130);
}
TEST(ReactorUnitTests, Intrinsics_Gather)
{
Function<Void(Pointer<Float> base, Pointer<Int4> offsets, Pointer<Float4> result)> function;
{
Pointer<Float> base = function.Arg<0>();
Pointer<Int4> offsets = function.Arg<1>();
Pointer<Float4> result = function.Arg<2>();
auto mask = Int4(~0, ~0, ~0, ~0);
unsigned int alignment = 1;
bool zeroMaskedLanes = true;
*result = Gather(base, *offsets, mask, alignment, zeroMaskedLanes);
}
float buffer[] = {
0, 10, 20, 30,
40, 50, 60, 70,
80, 90, 100, 110,
120, 130, 140, 150
};
constexpr auto elemSize = sizeof(buffer[0]);
int offsets[] = {
1 * elemSize,
6 * elemSize,
11 * elemSize,
13 * elemSize
};
auto routine = function("one");
auto entry = (void (*)(float *, int *, float *))routine->getEntry();
float result[4] = {};
entry(buffer, offsets, result);
EXPECT_EQ(result[0], 10);
EXPECT_EQ(result[1], 60);
EXPECT_EQ(result[2], 110);
EXPECT_EQ(result[3], 130);
}
TEST(ReactorUnitTests, ExtractFromRValue)
{
Function<Void(Pointer<Int4> values, Pointer<Int4> result)> function;
{
Pointer<Int4> vIn = function.Arg<0>();
Pointer<Int4> resultIn = function.Arg<1>();
RValue<Int4> v = *vIn;
Int4 result(678);
If(Extract(v, 0) == 42)
{
result = Insert(result, 1, 0);
}
If(Extract(v, 1) == 42)
{
result = Insert(result, 1, 1);
}
*resultIn = result;
Return();
}
auto routine = function("one");
auto entry = (void (*)(int *, int *))routine->getEntry();
int v[4] = { 42, 42, 42, <