Subzero: add REACTOR_EMIT_PRINT_LOCATION support Adds support for emitting print locations when using the Subzero backend. Very useful for debugging. Bug: b/149572931 Change-Id: I32fc14486cd7a021f424fb926dc776072374b931 Reviewed-on: https://swiftshader-review.googlesource.com/c/SwiftShader/+/41288 Tested-by: Antonio Maiorano <amaiorano@google.com> Reviewed-by: Ben Clayton <bclayton@google.com>

commit: aae33735e69931106bed4a6d5a32bfcc4631dee2 [log] [tgz]
author: Antonio Maiorano <amaiorano@google.com> Fri Feb 14 14:52:34 2020 -0500
committer: Antonio Maiorano <amaiorano@google.com> Mon Feb 17 20:03:34 2020 +0000
tree: debba0ffa0fad4dc3f13bb0799468b58a1d9beed
parent: d42d2fd9c9e2212b4804b72867051be0d41c219f [diff]
diff --git a/src/Reactor/LLVMReactor.cpp b/src/Reactor/LLVMReactor.cpp
index 7f780a6..4879076 100644
--- a/src/Reactor/LLVMReactor.cpp
+++ b/src/Reactor/LLVMReactor.cpp

@@ -1109,6 +1109,8 @@
 
 Value *Nucleus::createMaskedLoad(Value *ptr, Type *elTy, Value *mask, unsigned int alignment, bool zeroMaskedLanes)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
+
 	ASSERT(V(ptr)->getType()->isPointerTy());
 	ASSERT(V(mask)->getType()->isVectorTy());
 
@@ -1126,6 +1128,8 @@
 
 void Nucleus::createMaskedStore(Value *ptr, Value *val, Value *mask, unsigned int alignment)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
+
 	ASSERT(V(ptr)->getType()->isPointerTy());
 	ASSERT(V(val)->getType()->isVectorTy());
 	ASSERT(V(mask)->getType()->isVectorTy());
@@ -1163,6 +1167,7 @@
 
 void Nucleus::createFence(std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	jit->builder->CreateFence(atomicOrdering(true, memoryOrder));
 }
 
@@ -1658,6 +1663,7 @@
 
 Value *Nucleus::createConstantVector(const int64_t *constants, Type *type)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	ASSERT(llvm::isa<llvm::VectorType>(T(type)));
 	const int numConstants = elementCount(type);                                      // Number of provided constants for the (emulated) type.
 	const int numElements = llvm::cast<llvm::VectorType>(T(type))->getNumElements();  // Number of elements of the underlying vector type.
@@ -1674,6 +1680,7 @@
 
 Value *Nucleus::createConstantVector(const double *constants, Type *type)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	ASSERT(llvm::isa<llvm::VectorType>(T(type)));
 	const int numConstants = elementCount(type);                                      // Number of provided constants for the (emulated) type.
 	const int numElements = llvm::cast<llvm::VectorType>(T(type))->getNumElements();  // Number of elements of the underlying vector type.
@@ -1690,6 +1697,7 @@
 
 Value *Nucleus::createConstantString(const char *v)
 {
+	// NOTE: Do not call RR_DEBUG_INFO_UPDATE_LOC() here to avoid recursion when called from rr::Printv
 	auto ptr = jit->builder->CreateGlobalStringPtr(v);
 	return V(ptr);
 }
@@ -3152,18 +3160,21 @@
 
 RValue<Float4> Sin(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::sin, { V(v.value)->getType() });
 	return RValue<Float4>(V(jit->builder->CreateCall(func, V(v.value))));
 }
 
 RValue<Float4> Cos(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::cos, { V(v.value)->getType() });
 	return RValue<Float4>(V(jit->builder->CreateCall(func, V(v.value))));
 }
 
 RValue<Float4> Tan(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Sin(v) / Cos(v);
 }
 
@@ -3182,51 +3193,61 @@
 
 RValue<Float4> Asin(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "asinf");
 }
 
 RValue<Float4> Acos(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "acosf");
 }
 
 RValue<Float4> Atan(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "atanf");
 }
 
 RValue<Float4> Sinh(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Sinh(v);
 }
 
 RValue<Float4> Cosh(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Cosh(v);
 }
 
 RValue<Float4> Tanh(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "tanhf");
 }
 
 RValue<Float4> Asinh(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "asinhf");
 }
 
 RValue<Float4> Acosh(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "acoshf");
 }
 
 RValue<Float4> Atanh(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return TransformFloat4PerElement(v, "atanhf");
 }
 
 RValue<Float4> Atan2(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	::llvm::SmallVector<::llvm::Type *, 2> paramTys;
 	paramTys.push_back(T(Float::getType()));
 	paramTys.push_back(T(Float::getType()));
@@ -3245,36 +3266,42 @@
 
 RValue<Float4> Pow(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::pow, { T(Float4::getType()) });
 	return RValue<Float4>(V(jit->builder->CreateCall2(func, ARGS(V(x.value), V(y.value)))));
 }
 
 RValue<Float4> Exp(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::exp, { T(Float4::getType()) });
 	return RValue<Float4>(V(jit->builder->CreateCall(func, V(v.value))));
 }
 
 RValue<Float4> Log(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::log, { T(Float4::getType()) });
 	return RValue<Float4>(V(jit->builder->CreateCall(func, V(v.value))));
 }
 
 RValue<Float4> Exp2(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::exp2, { T(Float4::getType()) });
 	return RValue<Float4>(V(jit->builder->CreateCall(func, V(v.value))));
 }
 
 RValue<Float4> Log2(RValue<Float4> v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::log2, { T(Float4::getType()) });
 	return RValue<Float4>(V(jit->builder->CreateCall(func, V(v.value))));
 }
 
 RValue<UInt> Ctlz(RValue<UInt> v, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::ctlz, { T(UInt::getType()) });
 	return RValue<UInt>(V(jit->builder->CreateCall2(func, ARGS(
 	                                                          V(v.value),
@@ -3283,6 +3310,7 @@
 
 RValue<UInt4> Ctlz(RValue<UInt4> v, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::ctlz, { T(UInt4::getType()) });
 	return RValue<UInt4>(V(jit->builder->CreateCall2(func, ARGS(
 	                                                           V(v.value),
@@ -3291,6 +3319,7 @@
 
 RValue<UInt> Cttz(RValue<UInt> v, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::cttz, { T(UInt::getType()) });
 	return RValue<UInt>(V(jit->builder->CreateCall2(func, ARGS(
 	                                                          V(v.value),
@@ -3299,6 +3328,7 @@
 
 RValue<UInt4> Cttz(RValue<UInt4> v, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto func = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::cttz, { T(UInt4::getType()) });
 	return RValue<UInt4>(V(jit->builder->CreateCall2(func, ARGS(
 	                                                           V(v.value),
@@ -3340,6 +3370,7 @@
 
 RValue<Pointer<Byte>> ConstantPointer(void const *ptr)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// Note: this should work for 32-bit pointers as well because 'inttoptr'
 	// is defined to truncate (and zero extend) if necessary.
 	auto ptrAsInt = ::llvm::ConstantInt::get(::llvm::Type::getInt64Ty(jit->context), reinterpret_cast<uintptr_t>(ptr));
@@ -3348,6 +3379,7 @@
 
 RValue<Pointer<Byte>> ConstantData(void const *data, size_t size)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto str = ::std::string(reinterpret_cast<const char *>(data), size);
 	auto ptr = jit->builder->CreateGlobalStringPtr(str);
 	return RValue<Pointer<Byte>>(V(ptr));
@@ -3355,6 +3387,7 @@
 
 Value *Call(RValue<Pointer<Byte>> fptr, Type *retTy, std::initializer_list<Value *> args, std::initializer_list<Type *> argTys)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	::llvm::SmallVector<::llvm::Type *, 8> paramTys;
 	for(auto ty : argTys) { paramTys.push_back(T(ty)); }
 	auto funcTy = ::llvm::FunctionType::get(T(retTy), paramTys, false);
@@ -3369,6 +3402,7 @@
 
 void Breakpoint()
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	llvm::Function *debugtrap = llvm::Intrinsic::getDeclaration(jit->module.get(), llvm::Intrinsic::debugtrap);
 
 	jit->builder->CreateCall(debugtrap);

diff --git a/src/Reactor/LLVMReactorDebugInfo.cpp b/src/Reactor/LLVMReactorDebugInfo.cpp
index 5810d44..31f1a37 100644
--- a/src/Reactor/LLVMReactorDebugInfo.cpp
+++ b/src/Reactor/LLVMReactorDebugInfo.cpp

@@ -134,17 +134,7 @@
 	builder->SetCurrentDebugLocation(getLocation(backtrace, backtrace.size() - 1));
 
 #	ifdef ENABLE_RR_EMIT_PRINT_LOCATION
-	static Location lastLocation;
-	if(backtrace.size() == 0)
-	{
-		return;
-	}
-	Location currLocation = backtrace[backtrace.size() - 1];
-	if(currLocation != lastLocation)
-	{
-		rr::Print("rr> {0} [{1}:{2}]\n", currLocation.function.name.c_str(), currLocation.function.file.c_str(), currLocation.line);
-		lastLocation = std::move(currLocation);
-	}
+	emitPrintLocation(backtrace);
 #	endif  // ENABLE_RR_EMIT_PRINT_LOCATION
 }
 
@@ -443,48 +433,14 @@
 	diTypes.emplace(T(Float4::getType()), diBuilder->createVectorType(128, 128, diTypes[T(Float::getType())], { vec4 }));
 }
 
-DebugInfo::Location DebugInfo::getCallerLocation() const
+Location DebugInfo::getCallerLocation() const
 {
 	return getCallerBacktrace(1)[0];
 }
 
-DebugInfo::Backtrace DebugInfo::getCallerBacktrace(size_t limit /* = 0 */) const
+Backtrace DebugInfo::getCallerBacktrace(size_t limit /* = 0 */) const
 {
-	auto shouldSkipFile = [](llvm::StringRef fileSR) {
-		return fileSR.empty() ||
-		       fileSR.endswith_lower("ReactorDebugInfo.cpp") ||
-		       fileSR.endswith_lower("Reactor.cpp") ||
-		       fileSR.endswith_lower("Reactor.hpp") ||
-		       fileSR.endswith_lower("stacktrace.hpp");
-	};
-
-	std::vector<DebugInfo::Location> locations;
-
-	// Note that bs::stacktrace() effectively returns a vector of addresses; bs::frame construction is where
-	// the heavy lifting is done: resolving the function name, file and line number.
-	namespace bs = boost::stacktrace;
-	for(bs::frame frame : bs::stacktrace())
-	{
-		if(shouldSkipFile(frame.source_file()))
-		{
-			continue;
-		}
-
-		DebugInfo::Location location;
-		location.function.file = frame.source_file();
-		location.function.name = frame.name();
-		location.line = frame.source_line();
-		locations.push_back(location);
-
-		if(limit > 0 && locations.size() >= limit)
-		{
-			break;
-		}
-	}
-
-	std::reverse(locations.begin(), locations.end());
-
-	return locations;
+	return rr::getCallerBacktrace(limit);
 }
 
 llvm::DIType *DebugInfo::getOrCreateType(llvm::Type *type)

diff --git a/src/Reactor/LLVMReactorDebugInfo.hpp b/src/Reactor/LLVMReactorDebugInfo.hpp
index 6f320aa..276f44a 100644
--- a/src/Reactor/LLVMReactorDebugInfo.hpp
+++ b/src/Reactor/LLVMReactorDebugInfo.hpp

@@ -16,6 +16,7 @@
 #define rr_LLVMReactorDebugInfo_hpp
 
 #include "Reactor.hpp"
+#include "ReactorDebugInfo.hpp"
 
 #ifdef ENABLE_RR_DEBUG_INFO
 
@@ -111,44 +112,6 @@
 
 	using LineTokens = std::unordered_map<unsigned int, Token>;
 
-	struct FunctionLocation
-	{
-		std::string name;
-		std::string file;
-
-		bool operator==(const FunctionLocation &rhs) const { return name == rhs.name && file == rhs.file; }
-		bool operator!=(const FunctionLocation &rhs) const { return !(*this == rhs); }
-
-		struct Hash
-		{
-			std::size_t operator()(const FunctionLocation &l) const noexcept
-			{
-				return std::hash<std::string>()(l.file) * 31 +
-				       std::hash<std::string>()(l.name);
-			}
-		};
-	};
-
-	struct Location
-	{
-		FunctionLocation function;
-		unsigned int line = 0;
-
-		bool operator==(const Location &rhs) const { return function == rhs.function && line == rhs.line; }
-		bool operator!=(const Location &rhs) const { return !(*this == rhs); }
-
-		struct Hash
-		{
-			std::size_t operator()(const Location &l) const noexcept
-			{
-				return FunctionLocation::Hash()(l.function) * 31 +
-				       std::hash<unsigned int>()(l.line);
-			}
-		};
-	};
-
-	using Backtrace = std::vector<Location>;
-
 	struct Pending
 	{
 		std::string name;

diff --git a/src/Reactor/ReactorDebugInfo.cpp b/src/Reactor/ReactorDebugInfo.cpp
new file mode 100644
index 0000000..246574d
--- /dev/null
+++ b/src/Reactor/ReactorDebugInfo.cpp

@@ -0,0 +1,105 @@
+// Copyright 2020 The SwiftShader Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//  http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "ReactorDebugInfo.hpp"
+#include "Print.hpp"
+
+#ifdef ENABLE_RR_DEBUG_INFO
+
+#	include "boost/stacktrace.hpp"
+
+#	include <algorithm>
+
+namespace rr {
+
+namespace {
+std::string to_lower(std::string str)
+{
+	std::transform(str.begin(), str.end(), str.begin(),
+	               [](unsigned char c) { return std::tolower(c); });
+	return str;
+}
+
+bool endswith_lower(const std::string &str, const std::string &suffix)
+{
+	size_t strLen = str.size();
+	size_t suffixLen = suffix.size();
+
+	if(strLen < suffixLen)
+	{
+		return false;
+	}
+
+	return to_lower(str).substr(strLen - suffixLen) == to_lower(suffix);
+}
+}  // namespace
+
+Backtrace getCallerBacktrace(size_t limit /* = 0 */)
+{
+	auto shouldSkipFile = [](const std::string &fileSR) {
+		return fileSR.empty() ||
+		       endswith_lower(fileSR, "ReactorDebugInfo.cpp") ||
+		       endswith_lower(fileSR, "Reactor.cpp") ||
+		       endswith_lower(fileSR, "Reactor.hpp") ||
+		       endswith_lower(fileSR, "Traits.hpp") ||
+		       endswith_lower(fileSR, "stacktrace.hpp");
+	};
+
+	std::vector<Location> locations;
+
+	// Note that bs::stacktrace() effectively returns a vector of addresses; bs::frame construction is where
+	// the heavy lifting is done: resolving the function name, file and line number.
+	namespace bs = boost::stacktrace;
+	for(bs::frame frame : bs::stacktrace())
+	{
+		if(shouldSkipFile(frame.source_file()))
+		{
+			continue;
+		}
+
+		Location location;
+		location.function.file = frame.source_file();
+		location.function.name = frame.name();
+		location.line = frame.source_line();
+		locations.push_back(location);
+
+		if(limit > 0 && locations.size() >= limit)
+		{
+			break;
+		}
+	}
+
+	std::reverse(locations.begin(), locations.end());
+
+	return locations;
+}
+
+void emitPrintLocation(const Backtrace &backtrace)
+{
+	static Location lastLocation;
+	if(backtrace.size() == 0)
+	{
+		return;
+	}
+	Location currLocation = backtrace[backtrace.size() - 1];
+	if(currLocation != lastLocation)
+	{
+		rr::Print("rr> {0} [{1}:{2}]\n", currLocation.function.name.c_str(), currLocation.function.file.c_str(), currLocation.line);
+		lastLocation = std::move(currLocation);
+	}
+}
+
+}  // namespace rr
+
+#endif  // ENABLE_RR_DEBUG_INFO

diff --git a/src/Reactor/ReactorDebugInfo.hpp b/src/Reactor/ReactorDebugInfo.hpp
new file mode 100644
index 0000000..7f63093
--- /dev/null
+++ b/src/Reactor/ReactorDebugInfo.hpp

@@ -0,0 +1,75 @@
+// Copyright 2020 The SwiftShader Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//  http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef rr_ReactorDebugInfo_hpp
+#define rr_ReactorDebugInfo_hpp
+
+#ifdef ENABLE_RR_DEBUG_INFO
+
+#	include <vector>
+#	include <string>
+
+namespace rr {
+
+struct FunctionLocation
+{
+	std::string name;
+	std::string file;
+
+	bool operator==(const FunctionLocation &rhs) const { return name == rhs.name && file == rhs.file; }
+	bool operator!=(const FunctionLocation &rhs) const { return !(*this == rhs); }
+
+	struct Hash
+	{
+		std::size_t operator()(const FunctionLocation &l) const noexcept
+		{
+			return std::hash<std::string>()(l.file) * 31 +
+			       std::hash<std::string>()(l.name);
+		}
+	};
+};
+
+struct Location
+{
+	FunctionLocation function;
+	unsigned int line = 0;
+
+	bool operator==(const Location &rhs) const { return function == rhs.function && line == rhs.line; }
+	bool operator!=(const Location &rhs) const { return !(*this == rhs); }
+
+	struct Hash
+	{
+		std::size_t operator()(const Location &l) const noexcept
+		{
+			return FunctionLocation::Hash()(l.function) * 31 +
+			       std::hash<unsigned int>()(l.line);
+		}
+	};
+};
+
+using Backtrace = std::vector<Location>;
+
+// Returns the backtrace for the callstack, starting at the first
+// non-Reactor file. If limit is non-zero, then a maximum of limit
+// frames will be returned.
+Backtrace getCallerBacktrace(size_t limit = 0);
+
+// Emits a print location for the top of the input backtrace.
+void emitPrintLocation(const Backtrace &backtrace);
+
+}  // namespace rr
+
+#endif  // ENABLE_RR_DEBUG_INFO
+
+#endif  // rr_ReactorDebugInfo_hpp

diff --git a/src/Reactor/SubzeroReactor.cpp b/src/Reactor/SubzeroReactor.cpp
index 29aa1c8..e3d8e11 100644
--- a/src/Reactor/SubzeroReactor.cpp
+++ b/src/Reactor/SubzeroReactor.cpp

@@ -16,6 +16,7 @@
 #include "EmulatedReactor.hpp"
 #include "Print.hpp"
 #include "Reactor.hpp"
+#include "ReactorDebugInfo.hpp"
 
 #include "ExecutableMemory.hpp"
 #include "Optimizer.hpp"
@@ -1068,6 +1069,8 @@
 
 void Nucleus::createRetVoid()
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
+
 	// Code generated after this point is unreachable, so any variables
 	// being read can safely return an undefined value. We have to avoid
 	// materializing variables after the terminator ret instruction.
@@ -1079,6 +1082,8 @@
 
 void Nucleus::createRet(Value *v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
+
 	// Code generated after this point is unreachable, so any variables
 	// being read can safely return an undefined value. We have to avoid
 	// materializing variables after the terminator ret instruction.
@@ -1090,6 +1095,7 @@
 
 void Nucleus::createBr(BasicBlock *dest)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Variable::materializeAll();
 
 	auto br = Ice::InstBr::create(::function, dest);
@@ -1098,6 +1104,7 @@
 
 void Nucleus::createCondBr(Value *cond, BasicBlock *ifTrue, BasicBlock *ifFalse)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Variable::materializeAll();
 
 	auto br = Ice::InstBr::create(::function, cond, ifTrue, ifFalse);
@@ -1136,61 +1143,73 @@
 
 Value *Nucleus::createAdd(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Add, lhs, rhs);
 }
 
 Value *Nucleus::createSub(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Sub, lhs, rhs);
 }
 
 Value *Nucleus::createMul(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Mul, lhs, rhs);
 }
 
 Value *Nucleus::createUDiv(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Udiv, lhs, rhs);
 }
 
 Value *Nucleus::createSDiv(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Sdiv, lhs, rhs);
 }
 
 Value *Nucleus::createFAdd(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Fadd, lhs, rhs);
 }
 
 Value *Nucleus::createFSub(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Fsub, lhs, rhs);
 }
 
 Value *Nucleus::createFMul(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Fmul, lhs, rhs);
 }
 
 Value *Nucleus::createFDiv(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Fdiv, lhs, rhs);
 }
 
 Value *Nucleus::createURem(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Urem, lhs, rhs);
 }
 
 Value *Nucleus::createSRem(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Srem, lhs, rhs);
 }
 
 Value *Nucleus::createFRem(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// TODO(b/148139679) Fix Subzero generating invalid code for FRem on vector types
 	// createArithmetic(Ice::InstArithmetic::Frem, lhs, rhs);
 	UNIMPLEMENTED("b/148139679 Nucleus::createFRem");
@@ -1204,41 +1223,49 @@
 
 Value *Nucleus::createShl(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Shl, lhs, rhs);
 }
 
 Value *Nucleus::createLShr(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Lshr, lhs, rhs);
 }
 
 Value *Nucleus::createAShr(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Ashr, lhs, rhs);
 }
 
 Value *Nucleus::createAnd(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::And, lhs, rhs);
 }
 
 Value *Nucleus::createOr(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Or, lhs, rhs);
 }
 
 Value *Nucleus::createXor(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createArithmetic(Ice::InstArithmetic::Xor, lhs, rhs);
 }
 
 Value *Nucleus::createNeg(Value *v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createSub(createNullValue(T(v->getType())), v);
 }
 
 Value *Nucleus::createFNeg(Value *v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	double c[4] = { -0.0, -0.0, -0.0, -0.0 };
 	Value *negativeZero = Ice::isVectorType(v->getType()) ? createConstantVector(c, T(v->getType())) : V(::context->getConstantFloat(-0.0f));
 
@@ -1247,6 +1274,7 @@
 
 Value *Nucleus::createNot(Value *v)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(Ice::isScalarIntegerType(v->getType()))
 	{
 		return createXor(v, V(::context->getConstantInt(v->getType(), -1)));
@@ -1260,6 +1288,8 @@
 
 Value *Nucleus::createLoad(Value *ptr, Type *type, bool isVolatile, unsigned int align, bool atomic, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
+
 	ASSERT(!atomic);                                   // Unimplemented
 	ASSERT(memoryOrder == std::memory_order_relaxed);  // Unimplemented
 
@@ -1321,6 +1351,8 @@
 
 Value *Nucleus::createStore(Value *value, Value *ptr, Type *type, bool isVolatile, unsigned int align, bool atomic, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
+
 	ASSERT(!atomic);                                   // Unimplemented
 	ASSERT(memoryOrder == std::memory_order_relaxed);  // Unimplemented
 
@@ -1394,6 +1426,7 @@
 
 Value *Nucleus::createGEP(Value *ptr, Type *type, Value *index, bool unsignedIndex)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	ASSERT(index->getType() == Ice::IceType_i32);
 
 	if(auto *constant = llvm::dyn_cast<Ice::ConstantInteger32>(index))
@@ -1448,36 +1481,43 @@
 
 Value *Nucleus::createAtomicAdd(Value *ptr, Value *value, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createAtomicRMW(Ice::Intrinsics::AtomicAdd, ptr, value, memoryOrder);
 }
 
 Value *Nucleus::createAtomicSub(Value *ptr, Value *value, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createAtomicRMW(Ice::Intrinsics::AtomicSub, ptr, value, memoryOrder);
 }
 
 Value *Nucleus::createAtomicAnd(Value *ptr, Value *value, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createAtomicRMW(Ice::Intrinsics::AtomicAnd, ptr, value, memoryOrder);
 }
 
 Value *Nucleus::createAtomicOr(Value *ptr, Value *value, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createAtomicRMW(Ice::Intrinsics::AtomicOr, ptr, value, memoryOrder);
 }
 
 Value *Nucleus::createAtomicXor(Value *ptr, Value *value, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createAtomicRMW(Ice::Intrinsics::AtomicXor, ptr, value, memoryOrder);
 }
 
 Value *Nucleus::createAtomicExchange(Value *ptr, Value *value, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createAtomicRMW(Ice::Intrinsics::AtomicExchange, ptr, value, memoryOrder);
 }
 
 Value *Nucleus::createAtomicCompareExchange(Value *ptr, Value *value, Value *compare, std::memory_order memoryOrderEqual, std::memory_order memoryOrderUnequal)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *result = ::function->makeVariable(value->getType());
 
 	const Ice::Intrinsics::IntrinsicInfo intrinsic = { Ice::Intrinsics::AtomicCmpxchg, Ice::Intrinsics::SideEffects_T, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_T };
@@ -1511,46 +1551,55 @@
 
 Value *Nucleus::createTrunc(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Trunc, v, destType);
 }
 
 Value *Nucleus::createZExt(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Zext, v, destType);
 }
 
 Value *Nucleus::createSExt(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Sext, v, destType);
 }
 
 Value *Nucleus::createFPToUI(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Fptoui, v, destType);
 }
 
 Value *Nucleus::createFPToSI(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Fptosi, v, destType);
 }
 
 Value *Nucleus::createSIToFP(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Sitofp, v, destType);
 }
 
 Value *Nucleus::createFPTrunc(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Fptrunc, v, destType);
 }
 
 Value *Nucleus::createFPExt(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createCast(Ice::InstCast::Fpext, v, destType);
 }
 
 Value *Nucleus::createBitCast(Value *v, Type *destType)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// Bitcasts must be between types of the same logical size. But with emulated narrow vectors we need
 	// support for casting between scalars and wide vectors. For platforms where this is not supported,
 	// emulate them by writing to the stack and reading back as the destination type.
@@ -1586,56 +1635,67 @@
 
 Value *Nucleus::createPtrEQ(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Eq, lhs, rhs);
 }
 
 Value *Nucleus::createICmpEQ(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Eq, lhs, rhs);
 }
 
 Value *Nucleus::createICmpNE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Ne, lhs, rhs);
 }
 
 Value *Nucleus::createICmpUGT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Ugt, lhs, rhs);
 }
 
 Value *Nucleus::createICmpUGE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Uge, lhs, rhs);
 }
 
 Value *Nucleus::createICmpULT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Ult, lhs, rhs);
 }
 
 Value *Nucleus::createICmpULE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Ule, lhs, rhs);
 }
 
 Value *Nucleus::createICmpSGT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Sgt, lhs, rhs);
 }
 
 Value *Nucleus::createICmpSGE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Sge, lhs, rhs);
 }
 
 Value *Nucleus::createICmpSLT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Slt, lhs, rhs);
 }
 
 Value *Nucleus::createICmpSLE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createIntCompare(Ice::InstIcmp::Sle, lhs, rhs);
 }
 
@@ -1653,76 +1713,91 @@
 
 Value *Nucleus::createFCmpOEQ(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Oeq, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpOGT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ogt, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpOGE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Oge, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpOLT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Olt, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpOLE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ole, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpONE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::One, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpORD(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ord, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpUNO(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Uno, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpUEQ(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ueq, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpUGT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ugt, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpUGE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Uge, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpULT(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ult, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpULE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Ule, lhs, rhs);
 }
 
 Value *Nucleus::createFCmpUNE(Value *lhs, Value *rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createFloatCompare(Ice::InstFcmp::Une, lhs, rhs);
 }
 
 Value *Nucleus::createExtractElement(Value *vector, Type *type, int index)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto result = ::function->makeVariable(T(type));
 	auto extract = Ice::InstExtractElement::create(::function, result, V(vector), ::context->getConstantInt32(index));
 	::basicBlock->appendInst(extract);
@@ -1732,6 +1807,7 @@
 
 Value *Nucleus::createInsertElement(Value *vector, Value *element, int index)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto result = ::function->makeVariable(vector->getType());
 	auto insert = Ice::InstInsertElement::create(::function, result, vector, element, ::context->getConstantInt32(index));
 	::basicBlock->appendInst(insert);
@@ -1741,6 +1817,7 @@
 
 Value *Nucleus::createShuffleVector(Value *V1, Value *V2, const int *select)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	ASSERT(V1->getType() == V2->getType());
 
 	int size = Ice::typeNumElements(V1->getType());
@@ -1759,6 +1836,7 @@
 
 Value *Nucleus::createSelect(Value *C, Value *ifTrue, Value *ifFalse)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	ASSERT(ifTrue->getType() == ifFalse->getType());
 
 	auto result = ::function->makeVariable(ifTrue->getType());
@@ -1770,6 +1848,7 @@
 
 SwitchCases *Nucleus::createSwitch(Value *control, BasicBlock *defaultBranch, unsigned numCases)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	auto switchInst = Ice::InstSwitch::create(::function, numCases, control, defaultBranch);
 	::basicBlock->appendInst(switchInst);
 
@@ -1778,11 +1857,13 @@
 
 void Nucleus::addSwitchCase(SwitchCases *switchCases, int label, BasicBlock *branch)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	switchCases->addBranch(label, label, branch);
 }
 
 void Nucleus::createUnreachable()
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::InstUnreachable *unreachable = Ice::InstUnreachable::create(::function);
 	::basicBlock->appendInst(unreachable);
 }
@@ -1841,6 +1922,7 @@
 
 Value *Nucleus::createNullValue(Type *Ty)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(Ice::isVectorType(T(Ty)))
 	{
 		ASSERT(Ice::typeNumElements(T(Ty)) <= 16);
@@ -1855,51 +1937,61 @@
 
 Value *Nucleus::createConstantLong(int64_t i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt64(i));
 }
 
 Value *Nucleus::createConstantInt(int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt32(i));
 }
 
 Value *Nucleus::createConstantInt(unsigned int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt32(i));
 }
 
 Value *Nucleus::createConstantBool(bool b)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt1(b));
 }
 
 Value *Nucleus::createConstantByte(signed char i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt8(i));
 }
 
 Value *Nucleus::createConstantByte(unsigned char i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt8(i));
 }
 
 Value *Nucleus::createConstantShort(short i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt16(i));
 }
 
 Value *Nucleus::createConstantShort(unsigned short i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantInt16(i));
 }
 
 Value *Nucleus::createConstantFloat(float x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return V(::context->getConstantFloat(x));
 }
 
 Value *Nucleus::createNullPointer(Type *Ty)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return createNullValue(T(sizeof(void *) == 8 ? Ice::IceType_i64 : Ice::IceType_i32));
 }
 
@@ -1910,6 +2002,7 @@
 
 Value *Nucleus::createConstantVector(const int64_t *constants, Type *type)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	const int vectorSize = 16;
 	ASSERT(Ice::typeWidthInBytes(T(type)) == vectorSize);
 	const int alignment = vectorSize;
@@ -2005,6 +2098,7 @@
 
 Value *Nucleus::createConstantString(const char *v)
 {
+	// NOTE: Do not call RR_DEBUG_INFO_UPDATE_LOC() here to avoid recursion when called from rr::Printv
 	return V(IceConstantData(v, strlen(v) + 1));
 }
 
@@ -2067,6 +2161,7 @@
 
 RValue<Byte8> AddSat(RValue<Byte8> x, RValue<Byte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Byte8 result;
@@ -2097,6 +2192,7 @@
 
 RValue<Byte8> SubSat(RValue<Byte8> x, RValue<Byte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Byte8 result;
@@ -2127,16 +2223,19 @@
 
 RValue<SByte> Extract(RValue<SByte8> val, int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<SByte>(Nucleus::createExtractElement(val.value, SByte::getType(), i));
 }
 
 RValue<SByte8> Insert(RValue<SByte8> val, RValue<SByte> element, int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<SByte8>(Nucleus::createInsertElement(val.value, element.value, i));
 }
 
 RValue<SByte8> operator>>(RValue<SByte8> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		SByte8 result;
@@ -2167,6 +2266,7 @@
 
 RValue<Int> SignMask(RValue<Byte8> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		Byte8 xx = As<Byte8>(As<SByte8>(x) >> 7) & Byte8(0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80);
@@ -2192,6 +2292,7 @@
 
 RValue<Byte8> CmpEQ(RValue<Byte8> x, RValue<Byte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Byte8>(Nucleus::createICmpEQ(x.value, y.value));
 }
 
@@ -2212,11 +2313,13 @@
 
 RValue<SByte> SaturateSigned(RValue<Short> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return SByte(IfThenElse(Int(x) > 0x7F, Int(0x7F), IfThenElse(Int(x) < -0x80, Int(0x80), Int(x))));
 }
 
 RValue<SByte8> AddSat(RValue<SByte8> x, RValue<SByte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		SByte8 result;
@@ -2247,6 +2350,7 @@
 
 RValue<SByte8> SubSat(RValue<SByte8> x, RValue<SByte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		SByte8 result;
@@ -2277,6 +2381,7 @@
 
 RValue<Int> SignMask(RValue<SByte8> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		SByte8 xx = (x >> 7) & SByte8(0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80);
@@ -2297,11 +2402,13 @@
 
 RValue<Byte8> CmpGT(RValue<SByte8> x, RValue<SByte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Byte8>(createIntCompare(Ice::InstIcmp::Sgt, x.value, y.value));
 }
 
 RValue<Byte8> CmpEQ(RValue<SByte8> x, RValue<SByte8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Byte8>(Nucleus::createICmpEQ(x.value, y.value));
 }
 
@@ -2353,6 +2460,7 @@
 
 RValue<Short4> operator<<(RValue<Short4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short4 result;
@@ -2371,6 +2479,7 @@
 
 RValue<Short4> operator>>(RValue<Short4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short4 result;
@@ -2389,6 +2498,7 @@
 
 RValue<Short4> Max(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sle, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -2402,6 +2512,7 @@
 
 RValue<Short4> Min(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sgt, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -2415,11 +2526,13 @@
 
 RValue<Short> SaturateSigned(RValue<Int> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Short(IfThenElse(x > 0x7FFF, Int(0x7FFF), IfThenElse(x < -0x8000, Int(0x8000), x)));
 }
 
 RValue<Short4> AddSat(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short4 result;
@@ -2446,6 +2559,7 @@
 
 RValue<Short4> SubSat(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short4 result;
@@ -2472,6 +2586,7 @@
 
 RValue<Short4> MulHigh(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short4 result;
@@ -2498,6 +2613,7 @@
 
 RValue<Int2> MulAdd(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Int2 result;
@@ -2522,6 +2638,7 @@
 
 RValue<SByte8> PackSigned(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		SByte8 result;
@@ -2552,6 +2669,7 @@
 
 RValue<Byte8> PackUnsigned(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Byte8 result;
@@ -2582,11 +2700,13 @@
 
 RValue<Short4> CmpGT(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Short4>(createIntCompare(Ice::InstIcmp::Sgt, x.value, y.value));
 }
 
 RValue<Short4> CmpEQ(RValue<Short4> x, RValue<Short4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Short4>(Nucleus::createICmpEQ(x.value, y.value));
 }
 
@@ -2635,7 +2755,9 @@
 
 RValue<UShort4> operator<<(RValue<UShort4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
+
 	{
 		UShort4 result;
 		result = Insert(result, Extract(lhs, 0) << UShort(rhs), 0);
@@ -2653,6 +2775,7 @@
 
 RValue<UShort4> operator>>(RValue<UShort4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UShort4 result;
@@ -2671,6 +2794,7 @@
 
 RValue<UShort4> Max(RValue<UShort4> x, RValue<UShort4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v8i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ule, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -2697,11 +2821,13 @@
 
 RValue<UShort> SaturateUnsigned(RValue<Int> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return UShort(IfThenElse(x > 0xFFFF, Int(0xFFFF), IfThenElse(x < 0, Int(0), x)));
 }
 
 RValue<UShort4> AddSat(RValue<UShort4> x, RValue<UShort4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UShort4 result;
@@ -2728,6 +2854,7 @@
 
 RValue<UShort4> SubSat(RValue<UShort4> x, RValue<UShort4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UShort4 result;
@@ -2754,6 +2881,7 @@
 
 RValue<UShort4> MulHigh(RValue<UShort4> x, RValue<UShort4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UShort4 result;
@@ -2780,6 +2908,7 @@
 
 RValue<Int4> MulHigh(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// TODO: For x86, build an intrinsics version of this which uses shuffles + pmuludq.
 
 	// Scalarized implementation.
@@ -2794,6 +2923,7 @@
 
 RValue<UInt4> MulHigh(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// TODO: For x86, build an intrinsics version of this which uses shuffles + pmuludq.
 
 	if(false)  // Partial product based implementation.
@@ -2826,6 +2956,7 @@
 
 RValue<UShort4> Average(RValue<UShort4> x, RValue<UShort4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("RValue<UShort4> Average(RValue<UShort4> x, RValue<UShort4> y)");
 	return UShort4(0);
 }
@@ -2837,16 +2968,19 @@
 
 RValue<Short> Extract(RValue<Short8> val, int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Short>(Nucleus::createExtractElement(val.value, Short::getType(), i));
 }
 
 RValue<Short8> Insert(RValue<Short8> val, RValue<Short> element, int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Short8>(Nucleus::createInsertElement(val.value, element.value, i));
 }
 
 RValue<Short8> operator<<(RValue<Short8> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short8 result;
@@ -2869,6 +3003,7 @@
 
 RValue<Short8> operator>>(RValue<Short8> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short8 result;
@@ -2891,12 +3026,14 @@
 
 RValue<Int4> MulAdd(RValue<Short8> x, RValue<Short8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("RValue<Int4> MulAdd(RValue<Short8> x, RValue<Short8> y)");
 	return Int4(0);
 }
 
 RValue<Short8> MulHigh(RValue<Short8> x, RValue<Short8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("RValue<Short8> MulHigh(RValue<Short8> x, RValue<Short8> y)");
 	return Short8(0);
 }
@@ -2908,16 +3045,19 @@
 
 RValue<UShort> Extract(RValue<UShort8> val, int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UShort>(Nucleus::createExtractElement(val.value, UShort::getType(), i));
 }
 
 RValue<UShort8> Insert(RValue<UShort8> val, RValue<UShort> element, int i)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UShort8>(Nucleus::createInsertElement(val.value, element.value, i));
 }
 
 RValue<UShort8> operator<<(RValue<UShort8> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UShort8 result;
@@ -2940,6 +3080,7 @@
 
 RValue<UShort8> operator>>(RValue<UShort8> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UShort8 result;
@@ -2962,6 +3103,7 @@
 
 RValue<UShort8> MulHigh(RValue<UShort8> x, RValue<UShort8> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("RValue<UShort8> MulHigh(RValue<UShort8> x, RValue<UShort8> y)");
 	return UShort8(0);
 }
@@ -2973,6 +3115,7 @@
 
 RValue<Int> operator++(Int &val, int)  // Post-increment
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	RValue<Int> res = val;
 	val += 1;
 	return res;
@@ -2980,12 +3123,14 @@
 
 const Int &operator++(Int &val)  // Pre-increment
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	val += 1;
 	return val;
 }
 
 RValue<Int> operator--(Int &val, int)  // Post-decrement
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	RValue<Int> res = val;
 	val -= 1;
 	return res;
@@ -2993,12 +3138,14 @@
 
 const Int &operator--(Int &val)  // Pre-decrement
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	val -= 1;
 	return val;
 }
 
 RValue<Int> RoundInt(RValue<Float> cast)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		// Push the fractional part off the mantissa. Accurate up to +/-2^22.
@@ -3029,6 +3176,7 @@
 
 UInt::UInt(RValue<Float> cast)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// Smallest positive value representable in UInt, but not in Int
 	const unsigned int ustart = 0x80000000u;
 	const float ustartf = float(ustart);
@@ -3046,6 +3194,7 @@
 
 RValue<UInt> operator++(UInt &val, int)  // Post-increment
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	RValue<UInt> res = val;
 	val += 1;
 	return res;
@@ -3053,12 +3202,14 @@
 
 const UInt &operator++(UInt &val)  // Pre-increment
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	val += 1;
 	return val;
 }
 
 RValue<UInt> operator--(UInt &val, int)  // Post-decrement
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	RValue<UInt> res = val;
 	val -= 1;
 	return res;
@@ -3066,6 +3217,7 @@
 
 const UInt &operator--(UInt &val)  // Pre-decrement
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	val -= 1;
 	return val;
 }
@@ -3096,6 +3248,7 @@
 
 RValue<Int2> operator<<(RValue<Int2> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Int2 result;
@@ -3112,6 +3265,7 @@
 
 RValue<Int2> operator>>(RValue<Int2> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Int2 result;
@@ -3133,6 +3287,7 @@
 
 RValue<UInt2> operator<<(RValue<UInt2> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UInt2 result;
@@ -3149,6 +3304,7 @@
 
 RValue<UInt2> operator>>(RValue<UInt2> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UInt2 result;
@@ -3171,6 +3327,7 @@
 Int4::Int4(RValue<Byte4> cast)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Value *x = Nucleus::createBitCast(cast.value, Int::getType());
 	Value *a = Nucleus::createInsertElement(loadValue(), x, 0);
 
@@ -3190,6 +3347,7 @@
 Int4::Int4(RValue<SByte4> cast)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Value *x = Nucleus::createBitCast(cast.value, Int::getType());
 	Value *a = Nucleus::createInsertElement(loadValue(), x, 0);
 
@@ -3207,6 +3365,7 @@
 Int4::Int4(RValue<Short4> cast)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	int swizzle[8] = { 0, 0, 1, 1, 2, 2, 3, 3 };
 	Value *c = Nucleus::createShuffleVector(cast.value, cast.value, swizzle);
 
@@ -3216,6 +3375,7 @@
 Int4::Int4(RValue<UShort4> cast)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	int swizzle[8] = { 0, 8, 1, 9, 2, 10, 3, 11 };
 	Value *c = Nucleus::createShuffleVector(cast.value, Short8(0, 0, 0, 0, 0, 0, 0, 0).loadValue(), swizzle);
 	Value *d = Nucleus::createBitCast(c, Int4::getType());
@@ -3225,6 +3385,7 @@
 Int4::Int4(RValue<Int> rhs)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Value *vector = Nucleus::createBitCast(rhs.value, Int4::getType());
 
 	int swizzle[4] = { 0, 0, 0, 0 };
@@ -3235,6 +3396,7 @@
 
 RValue<Int4> operator<<(RValue<Int4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Int4 result;
@@ -3253,6 +3415,7 @@
 
 RValue<Int4> operator>>(RValue<Int4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Int4 result;
@@ -3271,36 +3434,43 @@
 
 RValue<Int4> CmpEQ(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createICmpEQ(x.value, y.value));
 }
 
 RValue<Int4> CmpLT(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createICmpSLT(x.value, y.value));
 }
 
 RValue<Int4> CmpLE(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createICmpSLE(x.value, y.value));
 }
 
 RValue<Int4> CmpNEQ(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createICmpNE(x.value, y.value));
 }
 
 RValue<Int4> CmpNLT(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createICmpSGE(x.value, y.value));
 }
 
 RValue<Int4> CmpNLE(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createICmpSGT(x.value, y.value));
 }
 
 RValue<Int4> Max(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sle, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -3314,6 +3484,7 @@
 
 RValue<Int4> Min(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Sgt, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -3327,6 +3498,7 @@
 
 RValue<Int4> RoundInt(RValue<Float4> cast)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		// Push the fractional part off the mantissa. Accurate up to +/-2^22.
@@ -3347,6 +3519,7 @@
 
 RValue<Short8> PackSigned(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		Short8 result;
@@ -3377,6 +3550,7 @@
 
 RValue<UShort8> PackUnsigned(RValue<Int4> x, RValue<Int4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || !(CPUID::SSE4_1 || CPUID::ARM))
 	{
 		RValue<Int4> sx = As<Int4>(x);
@@ -3403,6 +3577,7 @@
 
 RValue<Int> SignMask(RValue<Int4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		Int4 xx = (x >> 31) & Int4(0x00000001, 0x00000002, 0x00000004, 0x00000008);
@@ -3429,6 +3604,7 @@
 UInt4::UInt4(RValue<Float4> cast)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	// Smallest positive value representable in UInt, but not in Int
 	const unsigned int ustart = 0x80000000u;
 	const float ustartf = float(ustart);
@@ -3446,6 +3622,7 @@
 UInt4::UInt4(RValue<UInt> rhs)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Value *vector = Nucleus::createBitCast(rhs.value, UInt4::getType());
 
 	int swizzle[4] = { 0, 0, 0, 0 };
@@ -3456,6 +3633,7 @@
 
 RValue<UInt4> operator<<(RValue<UInt4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UInt4 result;
@@ -3474,6 +3652,7 @@
 
 RValue<UInt4> operator>>(RValue<UInt4> lhs, unsigned char rhs)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UInt4 result;
@@ -3492,36 +3671,43 @@
 
 RValue<UInt4> CmpEQ(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UInt4>(Nucleus::createICmpEQ(x.value, y.value));
 }
 
 RValue<UInt4> CmpLT(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UInt4>(Nucleus::createICmpULT(x.value, y.value));
 }
 
 RValue<UInt4> CmpLE(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UInt4>(Nucleus::createICmpULE(x.value, y.value));
 }
 
 RValue<UInt4> CmpNEQ(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UInt4>(Nucleus::createICmpNE(x.value, y.value));
 }
 
 RValue<UInt4> CmpNLT(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UInt4>(Nucleus::createICmpUGE(x.value, y.value));
 }
 
 RValue<UInt4> CmpNLE(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<UInt4>(Nucleus::createICmpUGT(x.value, y.value));
 }
 
 RValue<UInt4> Max(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ule, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -3535,6 +3721,7 @@
 
 RValue<UInt4> Min(RValue<UInt4> x, RValue<UInt4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
 	auto cmp = Ice::InstIcmp::create(::function, Ice::InstIcmp::Ugt, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -3558,16 +3745,19 @@
 
 RValue<Float> Rcp_pp(RValue<Float> x, bool exactAtPow2)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return 1.0f / x;
 }
 
 RValue<Float> RcpSqrt_pp(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Rcp_pp(Sqrt(x));
 }
 
 RValue<Float> Sqrt(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *result = ::function->makeVariable(Ice::IceType_f32);
 	const Ice::Intrinsics::IntrinsicInfo intrinsic = { Ice::Intrinsics::Sqrt, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F };
 	auto target = ::context->getConstantUndef(Ice::IceType_i32);
@@ -3580,26 +3770,31 @@
 
 RValue<Float> Round(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Float4(Round(Float4(x))).x;
 }
 
 RValue<Float> Trunc(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Float4(Trunc(Float4(x))).x;
 }
 
 RValue<Float> Frac(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Float4(Frac(Float4(x))).x;
 }
 
 RValue<Float> Floor(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Float4(Floor(Float4(x))).x;
 }
 
 RValue<Float> Ceil(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Float4(Ceil(Float4(x))).x;
 }
 
@@ -3616,6 +3811,7 @@
 Float4::Float4(RValue<Float> rhs)
     : XYZW(this)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Value *vector = Nucleus::createBitCast(rhs.value, Float4::getType());
 
 	int swizzle[4] = { 0, 0, 0, 0 };
@@ -3626,6 +3822,7 @@
 
 RValue<Float4> Max(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
 	auto cmp = Ice::InstFcmp::create(::function, Ice::InstFcmp::Ogt, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -3639,6 +3836,7 @@
 
 RValue<Float4> Min(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *condition = ::function->makeVariable(Ice::IceType_v4i1);
 	auto cmp = Ice::InstFcmp::create(::function, Ice::InstFcmp::Olt, condition, x.value, y.value);
 	::basicBlock->appendInst(cmp);
@@ -3652,16 +3850,19 @@
 
 RValue<Float4> Rcp_pp(RValue<Float4> x, bool exactAtPow2)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Float4(1.0f) / x;
 }
 
 RValue<Float4> RcpSqrt_pp(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return Rcp_pp(Sqrt(x));
 }
 
 RValue<Float4> Sqrt(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		Float4 result;
@@ -3687,6 +3888,7 @@
 
 RValue<Int> SignMask(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		Int4 xx = (As<Int4>(x) >> 31) & Int4(0x00000001, 0x00000002, 0x00000004, 0x00000008);
@@ -3707,66 +3909,79 @@
 
 RValue<Int4> CmpEQ(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpOEQ(x.value, y.value));
 }
 
 RValue<Int4> CmpLT(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpOLT(x.value, y.value));
 }
 
 RValue<Int4> CmpLE(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpOLE(x.value, y.value));
 }
 
 RValue<Int4> CmpNEQ(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpONE(x.value, y.value));
 }
 
 RValue<Int4> CmpNLT(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpOGE(x.value, y.value));
 }
 
 RValue<Int4> CmpNLE(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpOGT(x.value, y.value));
 }
 
 RValue<Int4> CmpUEQ(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpUEQ(x.value, y.value));
 }
 
 RValue<Int4> CmpULT(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpULT(x.value, y.value));
 }
 
 RValue<Int4> CmpULE(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpULE(x.value, y.value));
 }
 
 RValue<Int4> CmpUNEQ(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpUNE(x.value, y.value));
 }
 
 RValue<Int4> CmpUNLT(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpUGE(x.value, y.value));
 }
 
 RValue<Int4> CmpUNLE(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Int4>(Nucleus::createFCmpUGT(x.value, y.value));
 }
 
 RValue<Float4> Round(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics || CPUID::ARM)
 	{
 		// Push the fractional part off the mantissa. Accurate up to +/-2^22.
@@ -3792,6 +4007,7 @@
 
 RValue<Float4> Trunc(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(CPUID::SSE4_1)
 	{
 		Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
@@ -3812,6 +4028,7 @@
 
 RValue<Float4> Frac(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Float4 frc;
 
 	if(CPUID::SSE4_1)
@@ -3832,6 +4049,7 @@
 
 RValue<Float4> Floor(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(CPUID::SSE4_1)
 	{
 		Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
@@ -3852,6 +4070,7 @@
 
 RValue<Float4> Ceil(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(CPUID::SSE4_1)
 	{
 		Ice::Variable *result = ::function->makeVariable(Ice::IceType_v4f32);
@@ -3877,22 +4096,26 @@
 
 RValue<Long> Ticks()
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("RValue<Long> Ticks()");
 	return Long(Int(0));
 }
 
 RValue<Pointer<Byte>> ConstantPointer(void const *ptr)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Pointer<Byte>>{ V(sz::getConstantPointer(::context, ptr)) };
 }
 
 RValue<Pointer<Byte>> ConstantData(void const *data, size_t size)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return RValue<Pointer<Byte>>{ V(IceConstantData(data, size)) };
 }
 
 Value *Call(RValue<Pointer<Byte>> fptr, Type *retTy, std::initializer_list<Value *> args, std::initializer_list<Type *> argTys)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Ice::Variable *ret = nullptr;
 	if(retTy != nullptr)
 	{
@@ -3909,6 +4132,7 @@
 
 void Breakpoint()
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	const Ice::Intrinsics::IntrinsicInfo intrinsic = { Ice::Intrinsics::Trap, Ice::Intrinsics::SideEffects_F, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F };
 	auto target = ::context->getConstantUndef(Ice::IceType_i32);
 	auto trap = Ice::InstIntrinsicCall::create(::function, 0, nullptr, target, intrinsic);
@@ -3917,6 +4141,7 @@
 
 void Nucleus::createFence(std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	const Ice::Intrinsics::IntrinsicInfo intrinsic = { Ice::Intrinsics::AtomicFence, Ice::Intrinsics::SideEffects_T, Ice::Intrinsics::ReturnsTwice_F, Ice::Intrinsics::MemoryWrite_F };
 	auto target = ::context->getConstantUndef(Ice::IceType_i32);
 	auto inst = Ice::InstIntrinsicCall::create(::function, 0, nullptr, target, intrinsic);
@@ -3927,136 +4152,163 @@
 
 Value *Nucleus::createMaskedLoad(Value *ptr, Type *elTy, Value *mask, unsigned int alignment, bool zeroMaskedLanes)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("Subzero createMaskedLoad()");
 	return nullptr;
 }
 void Nucleus::createMaskedStore(Value *ptr, Value *val, Value *mask, unsigned int alignment)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	UNIMPLEMENTED_NO_BUG("Subzero createMaskedStore()");
 }
 
 RValue<Float4> Gather(RValue<Pointer<Float>> base, RValue<Int4> offsets, RValue<Int4> mask, unsigned int alignment, bool zeroMaskedLanes /* = false */)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Gather(base, offsets, mask, alignment, zeroMaskedLanes);
 }
 
 RValue<Int4> Gather(RValue<Pointer<Int>> base, RValue<Int4> offsets, RValue<Int4> mask, unsigned int alignment, bool zeroMaskedLanes /* = false */)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Gather(base, offsets, mask, alignment, zeroMaskedLanes);
 }
 
 void Scatter(RValue<Pointer<Float>> base, RValue<Float4> val, RValue<Int4> offsets, RValue<Int4> mask, unsigned int alignment)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Scatter(base, val, offsets, mask, alignment);
 }
 
 void Scatter(RValue<Pointer<Int>> base, RValue<Int4> val, RValue<Int4> offsets, RValue<Int4> mask, unsigned int alignment)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Scatter(base, val, offsets, mask, alignment);
 }
 
 RValue<Float> Exp2(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Exp2(x);
 }
 
 RValue<Float> Log2(RValue<Float> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Log2(x);
 }
 
 RValue<Float4> Sin(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Sin(x);
 }
 
 RValue<Float4> Cos(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Cos(x);
 }
 
 RValue<Float4> Tan(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Tan(x);
 }
 
 RValue<Float4> Asin(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Asin(x);
 }
 
 RValue<Float4> Acos(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Acos(x);
 }
 
 RValue<Float4> Atan(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Atan(x);
 }
 
 RValue<Float4> Sinh(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Sinh(x);
 }
 
 RValue<Float4> Cosh(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Cosh(x);
 }
 
 RValue<Float4> Tanh(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Tanh(x);
 }
 
 RValue<Float4> Asinh(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Asinh(x);
 }
 
 RValue<Float4> Acosh(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Acosh(x);
 }
 
 RValue<Float4> Atanh(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Atanh(x);
 }
 
 RValue<Float4> Atan2(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Atan2(x, y);
 }
 
 RValue<Float4> Pow(RValue<Float4> x, RValue<Float4> y)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Pow(x, y);
 }
 
 RValue<Float4> Exp(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Exp(x);
 }
 
 RValue<Float4> Log(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Log(x);
 }
 
 RValue<Float4> Exp2(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Exp2(x);
 }
 
 RValue<Float4> Log2(RValue<Float4> x)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::Log2(x);
 }
 
 RValue<UInt> Ctlz(RValue<UInt> x, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UNIMPLEMENTED_NO_BUG("Subzero Ctlz()");
@@ -4077,6 +4329,7 @@
 
 RValue<UInt4> Ctlz(RValue<UInt4> x, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UNIMPLEMENTED_NO_BUG("Subzero Ctlz()");
@@ -4096,6 +4349,7 @@
 
 RValue<UInt> Cttz(RValue<UInt> x, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UNIMPLEMENTED_NO_BUG("Subzero Cttz()");
@@ -4116,6 +4370,7 @@
 
 RValue<UInt4> Cttz(RValue<UInt4> x, bool isZeroUndef)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	if(emulateIntrinsics)
 	{
 		UNIMPLEMENTED_NO_BUG("Subzero Cttz()");
@@ -4135,25 +4390,36 @@
 
 RValue<Int> MinAtomic(RValue<Pointer<Int>> x, RValue<Int> y, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::MinAtomic(x, y, memoryOrder);
 }
 
 RValue<UInt> MinAtomic(RValue<Pointer<UInt>> x, RValue<UInt> y, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::MinAtomic(x, y, memoryOrder);
 }
 
 RValue<Int> MaxAtomic(RValue<Pointer<Int>> x, RValue<Int> y, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::MaxAtomic(x, y, memoryOrder);
 }
 
 RValue<UInt> MaxAtomic(RValue<Pointer<UInt>> x, RValue<UInt> y, std::memory_order memoryOrder)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	return emulated::MaxAtomic(x, y, memoryOrder);
 }
 
-void EmitDebugLocation() {}
+void EmitDebugLocation()
+{
+#ifdef ENABLE_RR_DEBUG_INFO
+#	ifdef ENABLE_RR_EMIT_PRINT_LOCATION
+	emitPrintLocation(getCallerBacktrace());
+#	endif  // ENABLE_RR_EMIT_PRINT_LOCATION
+#endif      // ENABLE_RR_DEBUG_INFO
+}
 void EmitDebugVariable(Value *value) {}
 void FlushDebug() {}
 
@@ -4580,6 +4846,7 @@
 
 void Nucleus::yield(Value *val)
 {
+	RR_DEBUG_INFO_UPDATE_LOC();
 	Variable::materializeAll();
 
 	// On first yield, we start generating coroutine functions
commit	aae33735e69931106bed4a6d5a32bfcc4631dee2	[log] [tgz]
author	Antonio Maiorano <amaiorano@google.com>	Fri Feb 14 14:52:34 2020 -0500
committer	Antonio Maiorano <amaiorano@google.com>	Mon Feb 17 20:03:34 2020 +0000
tree	debba0ffa0fad4dc3f13bb0799468b58a1d9beed
parent	d42d2fd9c9e2212b4804b72867051be0d41c219f [diff]