// third_party/subzero/crosstest/test_sync_atomic_main.cpp - SwiftShader - Git at Google

 //===- subzero/crosstest/test_sync_atomic_main.cpp - Driver for tests -----===//
 //
 //                        The Subzero Code Generator
 //
 // This file is distributed under the University of Illinois Open Source
 // License. See LICENSE.TXT for details.
 //
 //===----------------------------------------------------------------------===//
 //
 // Driver for cross testing atomic intrinsics, via the sync builtins.
 //
 //===----------------------------------------------------------------------===//

 /* crosstest.py --test=test_sync_atomic.cpp --crosstest-bitcode=0 \
    --driver=test_sync_atomic_main.cpp --prefix=Subzero_ \
    --output=test_sync_atomic */

 #include <pthread.h>
 #include <stdint.h>

 #include <cerrno>
 #include <climits>
 #include <cstdlib>
 #include <cstring>
 #include <iostream>

 // Include test_sync_atomic.h twice - once normally, and once within the
 // Subzero_ namespace, corresponding to the llc and Subzero translated
 // object files, respectively.
 #include "test_sync_atomic.h"
 #include "xdefs.h"
 namespace Subzero_ {
 #include "test_sync_atomic.h"
 }

 // Operand values for the atomic tests. The single-threaded tests read entries
 // from this table and narrow them with static_cast<Type> to the operand width
 // under test, so the wider entries reach the narrower types in truncated form.
 // The inline comments label entries with the floating-point value class that
 // their bit pattern corresponds to.
 // NOTE(review): uint64 is not declared in this file; presumably it comes from
 // xdefs.h -- confirm.
 volatile uint64 Values[] = {
     0, 1, 0x7e, 0x7f, 0x80, 0x81, 0xfe, 0xff, 0x7ffe, 0x7fff, 0x8000, 0x8001,
     0xfffe, 0xffff, 0x007fffff /*Max subnormal + */, 0x00800000 /*Min+ */,
     0x7f7fffff /*Max+ */, 0x7f800000 /*+Inf*/, 0xff800000 /*-Inf*/,
     0x7fa00000 /*SNaN*/, 0x7fc00000 /*QNaN*/, 0x7ffffffe, 0x7fffffff,
     0x80000000, 0x80000001, 0xfffffffe, 0xffffffff, 0x100000000ll,
     0x100000001ll, 0x000fffffffffffffll /*Max subnormal + */,
     0x0010000000000000ll /*Min+ */, 0x7fefffffffffffffll /*Max+ */,
     0x7ff0000000000000ll /*+Inf*/, 0xfff0000000000000ll /*-Inf*/,
     0x7ff0000000000001ll /*SNaN*/, 0x7ff8000000000000ll /*QNaN*/,
     0x7ffffffffffffffell, 0x7fffffffffffffffll, 0x8000000000000000ll,
     0x8000000000000001ll, 0xfffffffffffffffell, 0xffffffffffffffffll};

 // Number of entries in the Values table.
 const static size_t NumValues = sizeof(Values) / sizeof(*Values);

 // Memory locations the atomic operations act on. main() passes the address of
 // the member whose type matches the operand type of each test instantiation.
 struct {
   volatile uint8_t l8;
   volatile uint16_t l16;
   volatile uint32_t l32;
   volatile uint64 l64;
 } AtomicLocs;

 template <typename Type>
 void testAtomicRMW(volatile Type *AtomicLoc, size_t &TotalTests, size_t &Passes,
                    size_t &Failures) {
   typedef Type (*FuncType)(bool, volatile Type *, Type);
   static struct {
     const char *Name;
     FuncType FuncLlc;
     FuncType FuncSz;
   } Funcs[] = {
 #define X(inst)                                                                \
   { STR(inst), test_##inst, Subzero_::test_##inst }                            \
   , {STR(inst) "_alloca", test_alloca_##inst, Subzero_::test_alloca_##inst},   \
       {STR(inst) "_const", test_const_##inst, Subzero_::test_const_##inst},
       RMWOP_TABLE
 #undef X
   };
   const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs);

   for (size_t f = 0; f < NumFuncs; ++f) {
     for (size_t i = 0; i < NumValues; ++i) {
       Type Value1 = static_cast<Type>(Values[i]);
       for (size_t j = 0; j < NumValues; ++j) {
         Type Value2 = static_cast<Type>(Values[j]);
         for (size_t k = 0; k < 2; ++k) {
           bool fetch_first = k;
           ++TotalTests;
           *AtomicLoc = Value1;
           Type ResultSz1 = Funcs[f].FuncSz(fetch_first, AtomicLoc, Value2);
           Type ResultSz2 = *AtomicLoc;
           *AtomicLoc = Value1;
           Type ResultLlc1 = Funcs[f].FuncLlc(fetch_first, AtomicLoc, Value2);
           Type ResultLlc2 = *AtomicLoc;
           if (ResultSz1 == ResultLlc1 && ResultSz2 == ResultLlc2) {
             ++Passes;
           } else {
             ++Failures;
             std::cout << "test_" << Funcs[f].Name << (CHAR_BIT * sizeof(Type))
                       << "(" << fetch_first << ", "
                       << static_cast<uint64>(Value1) << ", "
                       << static_cast<uint64>(Value2)
                       << "): sz1=" << static_cast<uint64>(ResultSz1)
                       << " llc1=" << static_cast<uint64>(ResultLlc1)
                       << " sz2=" << static_cast<uint64>(ResultSz2)
                       << " llc2=" << static_cast<uint64>(ResultLlc2) << "\n";
           }
         }
       }
     }
   }
 }

 // Cross-checks the compare-and-swap test functions (val_cmp_swap and
 // val_cmp_swap_loop) between the llc build and the Subzero build.
 //
 // For each function, each ordered pair (Value1, Value2) taken from Values, and
 // both settings of "flip", *AtomicLoc is set to Value1 and the function is
 // called with an expected value of Value1 (flip == false) or Value2
 // (flip == true) and a desired value of Value2. A case passes only when both
 // the returned value and the final memory contents agree between the builds.
 //
 //   AtomicLoc  - location the operations are applied to.
 //   TotalTests - incremented once per case executed.
 //   Passes     - incremented for every case where the two builds agree.
 //   Failures   - incremented for every mismatch, which is also reported on
 //                std::cout.
 template <typename Type>
 void testValCompareAndSwap(volatile Type *AtomicLoc, size_t &TotalTests,
                            size_t &Passes, size_t &Failures) {
   typedef Type (*FuncType)(volatile Type *, Type, Type);
   static struct {
     const char *Name;
     FuncType FuncLlc;
     FuncType FuncSz;
   } Funcs[] = {{"val_cmp_swap", test_val_cmp_swap, Subzero_::test_val_cmp_swap},
                {"val_cmp_swap_loop", test_val_cmp_swap_loop,
                 Subzero_::test_val_cmp_swap_loop}};
   const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs);
   for (size_t f = 0; f < NumFuncs; ++f) {
     for (size_t i = 0; i < NumValues; ++i) {
       Type Value1 = static_cast<Type>(Values[i]);
       for (size_t j = 0; j < NumValues; ++j) {
         Type Value2 = static_cast<Type>(Values[j]);
         // The flip loop needs an index of its own: reusing the name "f" here
         // would shadow the function index, so that Funcs[] would be indexed by
         // the flip flag and each function would see only one flip setting.
         for (size_t k = 0; k < 2; ++k) {
           bool flip = k;
           ++TotalTests;
           *AtomicLoc = Value1;
           Type ResultSz1 =
               Funcs[f].FuncSz(AtomicLoc, flip ? Value2 : Value1, Value2);
           Type ResultSz2 = *AtomicLoc;
           *AtomicLoc = Value1;
           Type ResultLlc1 =
               Funcs[f].FuncLlc(AtomicLoc, flip ? Value2 : Value1, Value2);
           Type ResultLlc2 = *AtomicLoc;
           if (ResultSz1 == ResultLlc1 && ResultSz2 == ResultLlc2) {
             ++Passes;
           } else {
             ++Failures;
             std::cout << "test_" << Funcs[f].Name << (CHAR_BIT * sizeof(Type))
                       << "(" << static_cast<uint64>(Value1) << ", "
                       << static_cast<uint64>(Value2) << ", flip=" << flip
                       << "): sz1=" << static_cast<uint64>(ResultSz1)
                       << " llc1=" << static_cast<uint64>(ResultLlc1)
                       << " sz2=" << static_cast<uint64>(ResultSz2)
                       << " llc2=" << static_cast<uint64>(ResultLlc2) << "\n";
           }
         }
       }
     }
   }
 }

 // Argument bundle handed to a worker thread: the function to call together
 // with the three arguments it is called with.
 template <typename Type> struct ThreadData {
   // Signature shared by the read-modify-write test functions.
   typedef Type (*RMWFunc)(bool, volatile Type *, Type);

   RMWFunc FuncPtr;    // Function the thread calls repeatedly.
   bool Fetch;         // Passed as the first argument.
   volatile Type *Ptr; // Location passed as the second argument.
   Type Adjustment;    // Operand passed as the third argument.
 };

 template <typename Type> void *threadWrapper(void *Data) {
 #if defined(ARM32) || defined(MIPS32)
   // Given that most of times these crosstests for ARM are run under qemu, we
   // set a lower NumReps to allow crosstests to complete within a reasonable
   // amount of time.
   static const size_t NumReps = 1000;
 #else  // ARM32 || MIPS32
   static const size_t NumReps = 8000;
 #endif // ARM32 || MIPS32

   ThreadData<Type> *TData = reinterpret_cast<ThreadData<Type> *>(Data);
   for (size_t i = 0; i < NumReps; ++i) {
     (void)TData->FuncPtr(TData->Fetch, TData->Ptr, TData->Adjustment);
   }
   return NULL;
 }

 template <typename Type>
 void testAtomicRMWThreads(volatile Type *AtomicLoc, size_t &TotalTests,
                           size_t &Passes, size_t &Failures) {
   typedef Type (*FuncType)(bool, volatile Type *, Type);
   static struct {
     const char *Name;
     FuncType FuncLlc;
     FuncType FuncSz;
   } Funcs[] = {
 #define X(inst)                                                                \
   { STR(inst), test_##inst, Subzero_::test_##inst }                            \
   , {STR(inst) "_alloca", test_alloca_##inst, Subzero_::test_alloca_##inst},
       RMWOP_TABLE
 #undef X
   };
   const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs);

   // Just test a few values, otherwise it takes a *really* long time.
   volatile uint64 ValuesSubset[] = {1, 0x7e, 0x000fffffffffffffffll};
   const size_t NumValuesSubset = sizeof(ValuesSubset) / sizeof(*ValuesSubset);

   for (size_t f = 0; f < NumFuncs; ++f) {
     for (size_t i = 0; i < NumValuesSubset; ++i) {
       Type Value1 = static_cast<Type>(ValuesSubset[i]);
       for (size_t j = 0; j < NumValuesSubset; ++j) {
         Type Value2 = static_cast<Type>(ValuesSubset[j]);
         bool fetch_first = true;
         ThreadData<Type> TDataSz = {Funcs[f].FuncSz, fetch_first, AtomicLoc,
                                     Value2};
         ThreadData<Type> TDataLlc = {Funcs[f].FuncLlc, fetch_first, AtomicLoc,
                                      Value2};
         ++TotalTests;
         const size_t NumThreads = 4;
         pthread_t t[NumThreads];
         pthread_attr_t attr[NumThreads];

         // Try N threads w/ just Llc.
         *AtomicLoc = Value1;
         for (size_t m = 0; m < NumThreads; ++m) {
           pthread_attr_init(&attr[m]);
           if (pthread_create(&t[m], &attr[m], &threadWrapper<Type>,
                              reinterpret_cast<void *>(&TDataLlc)) != 0) {
             std::cout << "pthread_create failed w/ " << strerror(errno) << "\n";
             abort();
           }
         }
         for (size_t m = 0; m < NumThreads; ++m) {
           pthread_join(t[m], NULL);
         }
         Type ResultLlc = *AtomicLoc;

         // Try N threads w/ both Sz and Llc.
         *AtomicLoc = Value1;
         for (size_t m = 0; m < NumThreads; ++m) {
           pthread_attr_init(&attr[m]);
           if (pthread_create(&t[m], &attr[m], &threadWrapper<Type>,
                              m % 2 == 0
                                  ? reinterpret_cast<void *>(&TDataLlc)
                                  : reinterpret_cast<void *>(&TDataSz)) != 0) {
             ++Failures;
             std::cout << "pthread_create failed w/ " << strerror(errno) << "\n";
             abort();
           }
         }
         for (size_t m = 0; m < NumThreads; ++m) {
           if (pthread_join(t[m], NULL) != 0) {
             ++Failures;
             std::cout << "pthread_join failed w/ " << strerror(errno) << "\n";
             abort();
           }
         }
         Type ResultMixed = *AtomicLoc;

         if (ResultLlc == ResultMixed) {
           ++Passes;
         } else {
           ++Failures;
           std::cout << "test_with_threads_" << Funcs[f].Name
                     << (8 * sizeof(Type)) << "(" << static_cast<uint64>(Value1)
                     << ", " << static_cast<uint64>(Value2)
                     << "): llc=" << static_cast<uint64>(ResultLlc)
                     << " mixed=" << static_cast<uint64>(ResultMixed) << "\n";
         }
       }
     }
   }
 }

 // Runs the single-threaded RMW tests, the compare-and-swap tests and the
 // multi-threaded RMW tests for 8-, 16-, 32- and 64-bit operands, prints the
 // totals, and returns EXIT_SUCCESS only when no test failed.
 int main(int argc, char *argv[]) {
   (void)argc;
   (void)argv;

   size_t TotalTests = 0;
   size_t Passes = 0;
   size_t Failures = 0;

   testAtomicRMW<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures);
   testAtomicRMW<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, Failures);
   testAtomicRMW<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, Failures);
   testAtomicRMW<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures);
   testValCompareAndSwap<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures);
   testValCompareAndSwap<uint16_t>(&AtomicLocs.l16, TotalTests, Passes,
                                   Failures);
   testValCompareAndSwap<uint32_t>(&AtomicLocs.l32, TotalTests, Passes,
                                   Failures);
   testValCompareAndSwap<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures);
   testAtomicRMWThreads<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures);
   testAtomicRMWThreads<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, Failures);
   testAtomicRMWThreads<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, Failures);
   testAtomicRMWThreads<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures);

   std::cout << "TotalTests=" << TotalTests << " Passes=" << Passes
             << " Failures=" << Failures << "\n";
   // The count itself is not used as the exit status: it would be narrowed to
   // int, and only the low 8 bits of the status reach the parent process, so a
   // failure count that is a multiple of 256 would be reported as success.
   return Failures == 0 ? EXIT_SUCCESS : EXIT_FAILURE;
 }
	//===- subzero/crosstest/test_sync_atomic_main.cpp - Driver for tests -----===//
	//
	// The Subzero Code Generator
	//
	// This file is distributed under the University of Illinois Open Source
	// License. See LICENSE.TXT for details.
	//
	//===----------------------------------------------------------------------===//
	//
	// Driver for cross testing atomic intrinsics, via the sync builtins.
	//
	//===----------------------------------------------------------------------===//

	/* crosstest.py --test=test_sync_atomic.cpp --crosstest-bitcode=0 \
	--driver=test_sync_atomic_main.cpp --prefix=Subzero_ \
	--output=test_sync_atomic */

	#include <pthread.h>
	#include <stdint.h>

	#include <cerrno>
	#include <climits>
	#include <cstdlib>
	#include <cstring>
	#include <iostream>

	// Include test_sync_atomic.h twice - once normally, and once within the
	// Subzero_ namespace, corresponding to the llc and Subzero translated
	// object files, respectively.
	#include "test_sync_atomic.h"
	#include "xdefs.h"
	namespace Subzero_ {
	#include "test_sync_atomic.h"
	}

	// Operand values for the atomic tests. The single-threaded tests read entries
	// from this table and narrow them with static_cast<Type> to the operand width
	// under test, so the wider entries reach the narrower types in truncated form.
	// The inline comments label entries with the floating-point value class that
	// their bit pattern corresponds to.
	// NOTE(review): uint64 is not declared in this file; presumably it comes from
	// xdefs.h -- confirm.
	volatile uint64 Values[] = {
	    0, 1, 0x7e, 0x7f, 0x80, 0x81, 0xfe, 0xff, 0x7ffe, 0x7fff, 0x8000, 0x8001,
	    0xfffe, 0xffff, 0x007fffff /*Max subnormal + */, 0x00800000 /*Min+ */,
	    0x7f7fffff /*Max+ */, 0x7f800000 /*+Inf*/, 0xff800000 /*-Inf*/,
	    0x7fa00000 /*SNaN*/, 0x7fc00000 /*QNaN*/, 0x7ffffffe, 0x7fffffff,
	    0x80000000, 0x80000001, 0xfffffffe, 0xffffffff, 0x100000000ll,
	    0x100000001ll, 0x000fffffffffffffll /*Max subnormal + */,
	    0x0010000000000000ll /*Min+ */, 0x7fefffffffffffffll /*Max+ */,
	    0x7ff0000000000000ll /*+Inf*/, 0xfff0000000000000ll /*-Inf*/,
	    0x7ff0000000000001ll /*SNaN*/, 0x7ff8000000000000ll /*QNaN*/,
	    0x7ffffffffffffffell, 0x7fffffffffffffffll, 0x8000000000000000ll,
	    0x8000000000000001ll, 0xfffffffffffffffell, 0xffffffffffffffffll};

	// Number of entries in the Values table.
	const static size_t NumValues = sizeof(Values) / sizeof(*Values);

	// Memory locations the atomic operations act on. main() passes the address of
	// the member whose type matches the operand type of each test instantiation.
	struct {
	volatile uint8_t l8;
	volatile uint16_t l16;
	volatile uint32_t l32;
	volatile uint64 l64;
	} AtomicLocs;

	// Cross-checks the single-threaded behaviour of every read-modify-write test
	// function generated from RMWOP_TABLE (plain, "_alloca" and "_const"
	// variants). For each ordered pair of entries from Values, and for both
	// settings of fetch_first, the Subzero build and then the llc build are run
	// from the same starting contents of *AtomicLoc. A case passes only when both
	// the returned value and the final memory contents agree.
	//
	//   AtomicLoc  - location the operations are applied to.
	//   TotalTests - incremented once per case executed.
	//   Passes     - incremented for every case where the two builds agree.
	//   Failures   - incremented for every mismatch, which is also reported on
	//                std::cout.
	template <typename Type>
	void testAtomicRMW(volatile Type *AtomicLoc, size_t &TotalTests, size_t &Passes,
	                   size_t &Failures) {
	  // FuncType has to be a pointer-to-function type: the table below stores
	  // function addresses, and the location is passed by pointer.
	  typedef Type (*FuncType)(bool, volatile Type *, Type);
	  static struct {
	    const char *Name;
	    FuncType FuncLlc;
	    FuncType FuncSz;
	  } Funcs[] = {
	#define X(inst)                                                                \
	  { STR(inst), test_##inst, Subzero_::test_##inst }                            \
	  , {STR(inst) "_alloca", test_alloca_##inst, Subzero_::test_alloca_##inst},   \
	      {STR(inst) "_const", test_const_##inst, Subzero_::test_const_##inst},
	      RMWOP_TABLE
	#undef X
	  };
	  const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs);

	  for (size_t f = 0; f < NumFuncs; ++f) {
	    for (size_t i = 0; i < NumValues; ++i) {
	      Type Value1 = static_cast<Type>(Values[i]);
	      for (size_t j = 0; j < NumValues; ++j) {
	        Type Value2 = static_cast<Type>(Values[j]);
	        for (size_t k = 0; k < 2; ++k) {
	          bool fetch_first = k;
	          ++TotalTests;
	          *AtomicLoc = Value1;
	          Type ResultSz1 = Funcs[f].FuncSz(fetch_first, AtomicLoc, Value2);
	          Type ResultSz2 = *AtomicLoc;
	          *AtomicLoc = Value1;
	          Type ResultLlc1 = Funcs[f].FuncLlc(fetch_first, AtomicLoc, Value2);
	          Type ResultLlc2 = *AtomicLoc;
	          if (ResultSz1 == ResultLlc1 && ResultSz2 == ResultLlc2) {
	            ++Passes;
	          } else {
	            ++Failures;
	            std::cout << "test_" << Funcs[f].Name << (CHAR_BIT * sizeof(Type))
	                      << "(" << fetch_first << ", "
	                      << static_cast<uint64>(Value1) << ", "
	                      << static_cast<uint64>(Value2)
	                      << "): sz1=" << static_cast<uint64>(ResultSz1)
	                      << " llc1=" << static_cast<uint64>(ResultLlc1)
	                      << " sz2=" << static_cast<uint64>(ResultSz2)
	                      << " llc2=" << static_cast<uint64>(ResultLlc2) << "\n";
	          }
	        }
	      }
	    }
	  }
	}

	// Cross-checks the compare-and-swap test functions (val_cmp_swap and
	// val_cmp_swap_loop) between the llc build and the Subzero build.
	//
	// For each function, each ordered pair (Value1, Value2) taken from Values, and
	// both settings of "flip", *AtomicLoc is set to Value1 and the function is
	// called with an expected value of Value1 (flip == false) or Value2
	// (flip == true) and a desired value of Value2. A case passes only when both
	// the returned value and the final memory contents agree between the builds.
	//
	//   AtomicLoc  - location the operations are applied to.
	//   TotalTests - incremented once per case executed.
	//   Passes     - incremented for every case where the two builds agree.
	//   Failures   - incremented for every mismatch, which is also reported on
	//                std::cout.
	template <typename Type>
	void testValCompareAndSwap(volatile Type *AtomicLoc, size_t &TotalTests,
	                           size_t &Passes, size_t &Failures) {
	  // FuncType has to be a pointer-to-function type: the table below stores
	  // function addresses, and the location is passed by pointer.
	  typedef Type (*FuncType)(volatile Type *, Type, Type);
	  static struct {
	    const char *Name;
	    FuncType FuncLlc;
	    FuncType FuncSz;
	  } Funcs[] = {{"val_cmp_swap", test_val_cmp_swap, Subzero_::test_val_cmp_swap},
	               {"val_cmp_swap_loop", test_val_cmp_swap_loop,
	                Subzero_::test_val_cmp_swap_loop}};
	  const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs);
	  for (size_t f = 0; f < NumFuncs; ++f) {
	    for (size_t i = 0; i < NumValues; ++i) {
	      Type Value1 = static_cast<Type>(Values[i]);
	      for (size_t j = 0; j < NumValues; ++j) {
	        Type Value2 = static_cast<Type>(Values[j]);
	        // The flip loop needs an index of its own: reusing the name "f" here
	        // would shadow the function index, so that Funcs[] would be indexed by
	        // the flip flag and each function would see only one flip setting.
	        for (size_t k = 0; k < 2; ++k) {
	          bool flip = k;
	          ++TotalTests;
	          *AtomicLoc = Value1;
	          Type ResultSz1 =
	              Funcs[f].FuncSz(AtomicLoc, flip ? Value2 : Value1, Value2);
	          Type ResultSz2 = *AtomicLoc;
	          *AtomicLoc = Value1;
	          Type ResultLlc1 =
	              Funcs[f].FuncLlc(AtomicLoc, flip ? Value2 : Value1, Value2);
	          Type ResultLlc2 = *AtomicLoc;
	          if (ResultSz1 == ResultLlc1 && ResultSz2 == ResultLlc2) {
	            ++Passes;
	          } else {
	            ++Failures;
	            std::cout << "test_" << Funcs[f].Name << (CHAR_BIT * sizeof(Type))
	                      << "(" << static_cast<uint64>(Value1) << ", "
	                      << static_cast<uint64>(Value2) << ", flip=" << flip
	                      << "): sz1=" << static_cast<uint64>(ResultSz1)
	                      << " llc1=" << static_cast<uint64>(ResultLlc1)
	                      << " sz2=" << static_cast<uint64>(ResultSz2)
	                      << " llc2=" << static_cast<uint64>(ResultLlc2) << "\n";
	          }
	        }
	      }
	    }
	  }
	}

	// Argument bundle handed to a worker thread: the function to call together
	// with the three arguments it is called with.
	template <typename Type> struct ThreadData {
	  // Must be a pointer to function (not a member function declaration) so the
	  // struct stays an aggregate that can be brace-initialised with a function
	  // address; the location is passed by pointer.
	  Type (*FuncPtr)(bool, volatile Type *, Type);
	  bool Fetch;         // Passed as the first argument.
	  volatile Type *Ptr; // Location passed as the second argument.
	  Type Adjustment;    // Operand passed as the third argument.
	};

	template <typename Type> void threadWrapper(void Data) {
	#if defined(ARM32) \|\| defined(MIPS32)
	// Given that most of times these crosstests for ARM are run under qemu, we
	// set a lower NumReps to allow crosstests to complete within a reasonable
	// amount of time.
	static const size_t NumReps = 1000;
	#else // ARM32 \|\| MIPS32
	static const size_t NumReps = 8000;
	#endif // ARM32 \|\| MIPS32

	ThreadData<Type> TData = reinterpret_cast<ThreadData<Type> >(Data);
	for (size_t i = 0; i < NumReps; ++i) {
	(void)TData->FuncPtr(TData->Fetch, TData->Ptr, TData->Adjustment);
	}
	return NULL;
	}

	template <typename Type>
	void testAtomicRMWThreads(volatile Type *AtomicLoc, size_t &TotalTests,
	size_t &Passes, size_t &Failures) {
	typedef Type (FuncType)(bool, volatile Type , Type);
	static struct {
	const char *Name;
	FuncType FuncLlc;
	FuncType FuncSz;
	} Funcs[] = {
	#define X(inst) \
	{ STR(inst), test_##inst, Subzero_::test_##inst } \
	, {STR(inst) "_alloca", test_alloca_##inst, Subzero_::test_alloca_##inst},
	RMWOP_TABLE
	#undef X
	};
	const static size_t NumFuncs = sizeof(Funcs) / sizeof(*Funcs);

	// Just test a few values, otherwise it takes a really long time.
	volatile uint64 ValuesSubset[] = {1, 0x7e, 0x000fffffffffffffffll};
	const size_t NumValuesSubset = sizeof(ValuesSubset) / sizeof(*ValuesSubset);

	for (size_t f = 0; f < NumFuncs; ++f) {
	for (size_t i = 0; i < NumValuesSubset; ++i) {
	Type Value1 = static_cast<Type>(ValuesSubset[i]);
	for (size_t j = 0; j < NumValuesSubset; ++j) {
	Type Value2 = static_cast<Type>(ValuesSubset[j]);
	bool fetch_first = true;
	ThreadData<Type> TDataSz = {Funcs[f].FuncSz, fetch_first, AtomicLoc,
	Value2};
	ThreadData<Type> TDataLlc = {Funcs[f].FuncLlc, fetch_first, AtomicLoc,
	Value2};
	++TotalTests;
	const size_t NumThreads = 4;
	pthread_t t[NumThreads];
	pthread_attr_t attr[NumThreads];

	// Try N threads w/ just Llc.
	*AtomicLoc = Value1;
	for (size_t m = 0; m < NumThreads; ++m) {
	pthread_attr_init(&attr[m]);
	if (pthread_create(&t[m], &attr[m], &threadWrapper<Type>,
	reinterpret_cast<void *>(&TDataLlc)) != 0) {
	std::cout << "pthread_create failed w/ " << strerror(errno) << "\n";
	abort();
	}
	}
	for (size_t m = 0; m < NumThreads; ++m) {
	pthread_join(t[m], NULL);
	}
	Type ResultLlc = *AtomicLoc;

	// Try N threads w/ both Sz and Llc.
	*AtomicLoc = Value1;
	for (size_t m = 0; m < NumThreads; ++m) {
	pthread_attr_init(&attr[m]);
	if (pthread_create(&t[m], &attr[m], &threadWrapper<Type>,
	m % 2 == 0
	? reinterpret_cast<void *>(&TDataLlc)
	: reinterpret_cast<void *>(&TDataSz)) != 0) {
	++Failures;
	std::cout << "pthread_create failed w/ " << strerror(errno) << "\n";
	abort();
	}
	}
	for (size_t m = 0; m < NumThreads; ++m) {
	if (pthread_join(t[m], NULL) != 0) {
	++Failures;
	std::cout << "pthread_join failed w/ " << strerror(errno) << "\n";
	abort();
	}
	}
	Type ResultMixed = *AtomicLoc;

	if (ResultLlc == ResultMixed) {
	++Passes;
	} else {
	++Failures;
	std::cout << "test_with_threads_" << Funcs[f].Name
	<< (8 * sizeof(Type)) << "(" << static_cast<uint64>(Value1)
	<< ", " << static_cast<uint64>(Value2)
	<< "): llc=" << static_cast<uint64>(ResultLlc)
	<< " mixed=" << static_cast<uint64>(ResultMixed) << "\n";
	}
	}
	}
	}
	}

	// Runs the single-threaded RMW tests, the compare-and-swap tests and the
	// multi-threaded RMW tests for 8-, 16-, 32- and 64-bit operands, prints the
	// totals, and returns EXIT_SUCCESS only when no test failed.
	int main(int argc, char *argv[]) {
	  (void)argc;
	  (void)argv;

	  size_t TotalTests = 0;
	  size_t Passes = 0;
	  size_t Failures = 0;

	  testAtomicRMW<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures);
	  testAtomicRMW<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, Failures);
	  testAtomicRMW<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, Failures);
	  testAtomicRMW<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures);
	  testValCompareAndSwap<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures);
	  testValCompareAndSwap<uint16_t>(&AtomicLocs.l16, TotalTests, Passes,
	                                  Failures);
	  testValCompareAndSwap<uint32_t>(&AtomicLocs.l32, TotalTests, Passes,
	                                  Failures);
	  testValCompareAndSwap<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures);
	  testAtomicRMWThreads<uint8_t>(&AtomicLocs.l8, TotalTests, Passes, Failures);
	  testAtomicRMWThreads<uint16_t>(&AtomicLocs.l16, TotalTests, Passes, Failures);
	  testAtomicRMWThreads<uint32_t>(&AtomicLocs.l32, TotalTests, Passes, Failures);
	  testAtomicRMWThreads<uint64>(&AtomicLocs.l64, TotalTests, Passes, Failures);

	  std::cout << "TotalTests=" << TotalTests << " Passes=" << Passes
	            << " Failures=" << Failures << "\n";
	  // The count itself is not used as the exit status: it would be narrowed to
	  // int, and only the low 8 bits of the status reach the parent process, so a
	  // failure count that is a multiple of 256 would be reported as success.
	  return Failures == 0 ? EXIT_SUCCESS : EXIT_FAILURE;
	}