|  | //===- subzero/crosstest/test_sync_atomic_main.cpp - Driver for tests -----===// | 
|  | // | 
|  | //                        The Subzero Code Generator | 
|  | // | 
|  | // This file is distributed under the University of Illinois Open Source | 
|  | // License. See LICENSE.TXT for details. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  | // | 
|  | // Driver for cross testing atomic intrinsics, via the sync builtins. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  |  | 
|  | /* crosstest.py --test=test_sync_atomic.cpp --crosstest-bitcode=0 \ | 
|  | --driver=test_sync_atomic_main.cpp --prefix=Subzero_ \ | 
|  | --output=test_sync_atomic */ | 
|  |  | 
|  | #include <pthread.h> | 
|  | #include <stdint.h> | 
|  |  | 
|  | #include <cerrno> | 
|  | #include <climits> | 
|  | #include <cstdlib> | 
|  | #include <cstring> | 
|  | #include <iostream> | 
|  |  | 
|  | // Include test_sync_atomic.h twice - once normally, and once within the | 
|  | // Subzero_ namespace, corresponding to the llc and Subzero translated | 
|  | // object files, respectively. | 
|  | #include "test_sync_atomic.h" | 
|  | #include "xdefs.h" | 
|  | namespace Subzero_ { | 
|  | #include "test_sync_atomic.h" | 
|  | } | 
|  |  | 
|  | volatile uint64 Values[] = { | 
|  | 0, 1, 0x7e, 0x7f, 0x80, 0x81, 0xfe, 0xff, 0x7ffe, 0x7fff, 0x8000, 0x8001, | 
|  | 0xfffe, 0xffff, 0x007fffff /*Max subnormal + */, 0x00800000 /*Min+ */, | 
|  | 0x7f7fffff /*Max+ */, 0x7f800000 /*+Inf*/, 0xff800000 /*-Inf*/, | 
|  | 0x7fa00000 /*SNaN*/, 0x7fc00000 /*QNaN*/, 0x7ffffffe, 0x7fffffff, | 
|  | 0x80000000, 0x80000001, 0xfffffffe, 0xffffffff, 0x100000000ll, | 
|  | 0x100000001ll, 0x000fffffffffffffll /*Max subnormal + */, | 
|  | 0x0010000000000000ll /*Min+ */, 0x7fefffffffffffffll /*Max+ */, | 
|  | 0x7ff0000000000000ll /*+Inf*/, 0xfff0000000000000ll /*-Inf*/, | 
|  | 0x7ff0000000000001ll /*SNaN*/, 0x7ff8000000000000ll /*QNaN*/, | 
|  | 0x7ffffffffffffffell, 0x7fffffffffffffffll, 0x8000000000000000ll, | 
|  | 0x8000000000000001ll, 0xfffffffffffffffell, 0xffffffffffffffffll}; | 
|  |  | 
|  | const static size_t NumValues = sizeof(Values) / sizeof(*Values); | 
|  |  | 
|  | struct { | 
|  | volatile uint8_t l8; | 
|  | volatile uint16_t l16; | 
|  | volatile uint32_t l32; | 
|  | volatile uint64 l64; | 
|  | } AtomicLocs; | 
|  |  | 
|  | template <typename Type> | 
|  | void testAtomicRMW(volatile Type *AtomicLoc, size_t &TotalTests, size_t &Passes, | 
|  | size_t &Failures) { | 
|  | typedef Type (*FuncType)(bool, volatile Type *, Type); | 
|  | static struct { | 
|  | const char *Name; | 
|  | FuncType FuncLlc; | 
|  | FuncType FuncSz; | 
|  | } Funcs[] = { | 
|  | #define X(inst)                                                                \ | 
|  | { STR(inst), test_##inst, Subzero_::test_##inst }                            \ | 
|  | , {STR(inst) "_alloca", test_alloca_##inst, Subzero_::test_alloca_##inst},   \ | 
|  | {STR(inst) "_const", test_const_##inst, Subzero_::test_const_##inst}, | 
|  | RMWOP_TABLE | 
|  | #undef X | 
|  | }; | 
|  | const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs); | 
|  |  | 
|  | for (size_t f = 0; f < NumFuncs; ++f) { | 
|  | for (size_t i = 0; i < NumValues; ++i) { | 
|  | Type Value1 = static_cast<Type>(Values[i]); | 
|  | for (size_t j = 0; j < NumValues; ++j) { | 
|  | Type Value2 = static_cast<Type>(Values[j]); | 
|  | for (size_t k = 0; k < 2; ++k) { | 
|  | bool fetch_first = k; | 
|  | ++TotalTests; | 
|  | *AtomicLoc = Value1; | 
|  | Type ResultSz1 = Funcs[f].FuncSz(fetch_first, AtomicLoc, Value2); | 
|  | Type ResultSz2 = *AtomicLoc; | 
|  | *AtomicLoc = Value1; | 
|  | Type ResultLlc1 = Funcs[f].FuncLlc(fetch_first, AtomicLoc, Value2); | 
|  | Type ResultLlc2 = *AtomicLoc; | 
|  | if (ResultSz1 == ResultLlc1 && ResultSz2 == ResultLlc2) { | 
|  | ++Passes; | 
|  | } else { | 
|  | ++Failures; | 
|  | std::cout << "test_" << Funcs[f].Name << (CHAR_BIT * sizeof(Type)) | 
|  | << "(" << fetch_first << ", " | 
|  | << static_cast<uint64>(Value1) << ", " | 
|  | << static_cast<uint64>(Value2) | 
|  | << "): sz1=" << static_cast<uint64>(ResultSz1) | 
|  | << " llc1=" << static_cast<uint64>(ResultLlc1) | 
|  | << " sz2=" << static_cast<uint64>(ResultSz2) | 
|  | << " llc2=" << static_cast<uint64>(ResultLlc2) << "\n"; | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | template <typename Type> | 
|  | void testValCompareAndSwap(volatile Type *AtomicLoc, size_t &TotalTests, | 
|  | size_t &Passes, size_t &Failures) { | 
|  | typedef Type (*FuncType)(volatile Type *, Type, Type); | 
|  | static struct { | 
|  | const char *Name; | 
|  | FuncType FuncLlc; | 
|  | FuncType FuncSz; | 
|  | } Funcs[] = {{"val_cmp_swap", test_val_cmp_swap, Subzero_::test_val_cmp_swap}, | 
|  | {"val_cmp_swap_loop", test_val_cmp_swap_loop, | 
|  | Subzero_::test_val_cmp_swap_loop}}; | 
|  | const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs); | 
|  | for (size_t f = 0; f < NumFuncs; ++f) { | 
|  | for (size_t i = 0; i < NumValues; ++i) { | 
|  | Type Value1 = static_cast<Type>(Values[i]); | 
|  | for (size_t j = 0; j < NumValues; ++j) { | 
|  | Type Value2 = static_cast<Type>(Values[j]); | 
|  | for (size_t f = 0; f < 2; ++f) { | 
|  | bool flip = f; | 
|  | ++TotalTests; | 
|  | *AtomicLoc = Value1; | 
|  | Type ResultSz1 = | 
|  | Funcs[f].FuncSz(AtomicLoc, flip ? Value2 : Value1, Value2); | 
|  | Type ResultSz2 = *AtomicLoc; | 
|  | *AtomicLoc = Value1; | 
|  | Type ResultLlc1 = | 
|  | Funcs[f].FuncLlc(AtomicLoc, flip ? Value2 : Value1, Value2); | 
|  | Type ResultLlc2 = *AtomicLoc; | 
|  | if (ResultSz1 == ResultLlc1 && ResultSz2 == ResultLlc2) { | 
|  | ++Passes; | 
|  | } else { | 
|  | ++Failures; | 
|  | std::cout << "test_" << Funcs[f].Name << (CHAR_BIT * sizeof(Type)) | 
|  | << "(" << static_cast<uint64>(Value1) << ", " | 
|  | << static_cast<uint64>(Value2) << ", flip=" << flip | 
|  | << "): sz1=" << static_cast<uint64>(ResultSz1) | 
|  | << " llc1=" << static_cast<uint64>(ResultLlc1) | 
|  | << " sz2=" << static_cast<uint64>(ResultSz2) | 
|  | << " llc2=" << static_cast<uint64>(ResultLlc2) << "\n"; | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | template <typename Type> struct ThreadData { | 
|  | Type (*FuncPtr)(bool, volatile Type *, Type); | 
|  | bool Fetch; | 
|  | volatile Type *Ptr; | 
|  | Type Adjustment; | 
|  | }; | 
|  |  | 
|  | template <typename Type> void *threadWrapper(void *Data) { | 
|  | #if defined(ARM32) || defined(MIPS32) | 
|  | // Given that most of times these crosstests for ARM are run under qemu, we | 
|  | // set a lower NumReps to allow crosstests to complete within a reasonable | 
|  | // amount of time. | 
|  | static const size_t NumReps = 1000; | 
|  | #else  // ARM32 || MIPS32 | 
|  | static const size_t NumReps = 8000; | 
|  | #endif // ARM32 || MIPS32 | 
|  |  | 
|  | ThreadData<Type> *TData = reinterpret_cast<ThreadData<Type> *>(Data); | 
|  | for (size_t i = 0; i < NumReps; ++i) { | 
|  | (void)TData->FuncPtr(TData->Fetch, TData->Ptr, TData->Adjustment); | 
|  | } | 
|  | return NULL; | 
|  | } | 
|  |  | 
|  | template <typename Type> | 
|  | void testAtomicRMWThreads(volatile Type *AtomicLoc, size_t &TotalTests, | 
|  | size_t &Passes, size_t &Failures) { | 
|  | typedef Type (*FuncType)(bool, volatile Type *, Type); | 
|  | static struct { | 
|  | const char *Name; | 
|  | FuncType FuncLlc; | 
|  | FuncType FuncSz; | 
|  | } Funcs[] = { | 
|  | #define X(inst)                                                                \ | 
|  | { STR(inst), test_##inst, Subzero_::test_##inst }                            \ | 
|  | , {STR(inst) "_alloca", test_alloca_##inst, Subzero_::test_alloca_##inst}, | 
|  | RMWOP_TABLE | 
|  | #undef X | 
|  | }; | 
|  | const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs); | 
|  |  | 
|  | // Just test a few values, otherwise it takes a *really* long time. | 
|  | volatile uint64 ValuesSubset[] = {1, 0x7e, 0x000fffffffffffffffll}; | 
|  | const size_t NumValuesSubset = sizeof(ValuesSubset) / sizeof(*ValuesSubset); | 
|  |  | 
|  | for (size_t f = 0; f < NumFuncs; ++f) { | 
|  | for (size_t i = 0; i < NumValuesSubset; ++i) { | 
|  | Type Value1 = static_cast<Type>(ValuesSubset[i]); | 
|  | for (size_t j = 0; j < NumValuesSubset; ++j) { | 
|  | Type Value2 = static_cast<Type>(ValuesSubset[j]); | 
|  | bool fetch_first = true; | 
|  | ThreadData<Type> TDataSz = {Funcs[f].FuncSz, fetch_first, AtomicLoc, | 
|  | Value2}; | 
|  | ThreadData<Type> TDataLlc = {Funcs[f].FuncLlc, fetch_first, AtomicLoc, | 
|  | Value2}; | 
|  | ++TotalTests; | 
|  | const size_t NumThreads = 4; | 
|  | pthread_t t[NumThreads]; | 
|  | pthread_attr_t attr[NumThreads]; | 
|  |  | 
|  | // Try N threads w/ just Llc. | 
|  | *AtomicLoc = Value1; | 
|  | for (size_t m = 0; m < NumThreads; ++m) { | 
|  | pthread_attr_init(&attr[m]); | 
|  | if (pthread_create(&t[m], &attr[m], &threadWrapper<Type>, | 
|  | reinterpret_cast<void *>(&TDataLlc)) != 0) { | 
|  | std::cout << "pthread_create failed w/ " << strerror(errno) << "\n"; | 
|  | abort(); | 
|  | } | 
|  | } | 
|  | for (size_t m = 0; m < NumThreads; ++m) { | 
|  | pthread_join(t[m], NULL); | 
|  | } | 
|  | Type ResultLlc = *AtomicLoc; | 
|  |  | 
|  | // Try N threads w/ both Sz and Llc. | 
|  | *AtomicLoc = Value1; | 
|  | for (size_t m = 0; m < NumThreads; ++m) { | 
|  | pthread_attr_init(&attr[m]); | 
|  | if (pthread_create(&t[m], &attr[m], &threadWrapper<Type>, | 
|  | m % 2 == 0 | 
|  | ? reinterpret_cast<void *>(&TDataLlc) | 
|  | : reinterpret_cast<void *>(&TDataSz)) != 0) { | 
|  | ++Failures; | 
|  | std::cout << "pthread_create failed w/ " << strerror(errno) << "\n"; | 
|  | abort(); | 
|  | } | 
|  | } | 
|  | for (size_t m = 0; m < NumThreads; ++m) { | 
|  | if (pthread_join(t[m], NULL) != 0) { | 
|  | ++Failures; | 
|  | std::cout << "pthread_join failed w/ " << strerror(errno) << "\n"; | 
|  | abort(); | 
|  | } | 
|  | } | 
|  | Type ResultMixed = *AtomicLoc; | 
|  |  | 
|  | if (ResultLlc == ResultMixed) { | 
|  | ++Passes; | 
|  | } else { | 
|  | ++Failures; | 
|  | std::cout << "test_with_threads_" << Funcs[f].Name | 
|  | << (8 * sizeof(Type)) << "(" << static_cast<uint64>(Value1) | 
|  | << ", " << static_cast<uint64>(Value2) | 
|  | << "): llc=" << static_cast<uint64>(ResultLlc) | 
|  | << " mixed=" << static_cast<uint64>(ResultMixed) << "\n"; | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | int main(int argc, char *argv[]) { | 
|  | size_t TotalTests = 0; | 
|  | size_t Passes = 0; | 
|  | size_t Failures = 0; | 
|  |  | 
|  | testAtomicRMW<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures); | 
|  | testAtomicRMW<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, Failures); | 
|  | testAtomicRMW<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, Failures); | 
|  | testAtomicRMW<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures); | 
|  | testValCompareAndSwap<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures); | 
|  | testValCompareAndSwap<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, | 
|  | Failures); | 
|  | testValCompareAndSwap<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, | 
|  | Failures); | 
|  | testValCompareAndSwap<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures); | 
|  | testAtomicRMWThreads<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures); | 
|  | testAtomicRMWThreads<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, Failures); | 
|  | testAtomicRMWThreads<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, Failures); | 
|  | testAtomicRMWThreads<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures); | 
|  |  | 
|  | std::cout << "TotalTests=" << TotalTests << " Passes=" << Passes | 
|  | << " Failures=" << Failures << "\n"; | 
|  | return Failures; | 
|  | } |