third_party/llvm-7.0/llvm/lib/CodeGen/ExpandReductions.cpp - SwiftShader - Git at Google

 //===--- ExpandReductions.cpp - Expand experimental reduction intrinsics --===//
 //
 //                     The LLVM Compiler Infrastructure
 //
 // This file is distributed under the University of Illinois Open Source
 // License. See LICENSE.TXT for details.
 //
 //===----------------------------------------------------------------------===//
 //
 // This pass implements IR expansion for reduction intrinsics, allowing targets
 // to enable the experimental intrinsics until just before codegen.
 //
 //===----------------------------------------------------------------------===//

 #include "llvm/CodeGen/ExpandReductions.h"
 #include "llvm/Analysis/TargetTransformInfo.h"
 #include "llvm/CodeGen/Passes.h"
 #include "llvm/IR/Function.h"
 #include "llvm/IR/IRBuilder.h"
 #include "llvm/IR/InstIterator.h"
 #include "llvm/IR/IntrinsicInst.h"
 #include "llvm/IR/Intrinsics.h"
 #include "llvm/IR/Module.h"
 #include "llvm/Pass.h"
 #include "llvm/Transforms/Utils/LoopUtils.h"

 using namespace llvm;

 namespace {

 unsigned getOpcode(Intrinsic::ID ID) {
   switch (ID) {
   case Intrinsic::experimental_vector_reduce_fadd:
     return Instruction::FAdd;
   case Intrinsic::experimental_vector_reduce_fmul:
     return Instruction::FMul;
   case Intrinsic::experimental_vector_reduce_add:
     return Instruction::Add;
   case Intrinsic::experimental_vector_reduce_mul:
     return Instruction::Mul;
   case Intrinsic::experimental_vector_reduce_and:
     return Instruction::And;
   case Intrinsic::experimental_vector_reduce_or:
     return Instruction::Or;
   case Intrinsic::experimental_vector_reduce_xor:
     return Instruction::Xor;
   case Intrinsic::experimental_vector_reduce_smax:
   case Intrinsic::experimental_vector_reduce_smin:
   case Intrinsic::experimental_vector_reduce_umax:
   case Intrinsic::experimental_vector_reduce_umin:
     return Instruction::ICmp;
   case Intrinsic::experimental_vector_reduce_fmax:
   case Intrinsic::experimental_vector_reduce_fmin:
     return Instruction::FCmp;
   default:
     llvm_unreachable("Unexpected ID");
   }
 }

 RecurrenceDescriptor::MinMaxRecurrenceKind getMRK(Intrinsic::ID ID) {
   switch (ID) {
   case Intrinsic::experimental_vector_reduce_smax:
     return RecurrenceDescriptor::MRK_SIntMax;
   case Intrinsic::experimental_vector_reduce_smin:
     return RecurrenceDescriptor::MRK_SIntMin;
   case Intrinsic::experimental_vector_reduce_umax:
     return RecurrenceDescriptor::MRK_UIntMax;
   case Intrinsic::experimental_vector_reduce_umin:
     return RecurrenceDescriptor::MRK_UIntMin;
   case Intrinsic::experimental_vector_reduce_fmax:
     return RecurrenceDescriptor::MRK_FloatMax;
   case Intrinsic::experimental_vector_reduce_fmin:
     return RecurrenceDescriptor::MRK_FloatMin;
   default:
     return RecurrenceDescriptor::MRK_Invalid;
   }
 }

 bool expandReductions(Function &F, const TargetTransformInfo *TTI) {
   bool Changed = false;
   SmallVector<IntrinsicInst *, 4> Worklist;
   for (inst_iterator I = inst_begin(F), E = inst_end(F); I != E; ++I)
     if (auto II = dyn_cast<IntrinsicInst>(&*I))
       Worklist.push_back(II);

   for (auto *II : Worklist) {
     IRBuilder<> Builder(II);
     bool IsOrdered = false;
     Value *Acc = nullptr;
     Value *Vec = nullptr;
     auto ID = II->getIntrinsicID();
     auto MRK = RecurrenceDescriptor::MRK_Invalid;
     switch (ID) {
     case Intrinsic::experimental_vector_reduce_fadd:
     case Intrinsic::experimental_vector_reduce_fmul:
       // FMFs must be attached to the call, otherwise it's an ordered reduction
       // and it can't be handled by generating a shuffle sequence.
       if (!II->getFastMathFlags().isFast())
         IsOrdered = true;
       Acc = II->getArgOperand(0);
       Vec = II->getArgOperand(1);
       break;
     case Intrinsic::experimental_vector_reduce_add:
     case Intrinsic::experimental_vector_reduce_mul:
     case Intrinsic::experimental_vector_reduce_and:
     case Intrinsic::experimental_vector_reduce_or:
     case Intrinsic::experimental_vector_reduce_xor:
     case Intrinsic::experimental_vector_reduce_smax:
     case Intrinsic::experimental_vector_reduce_smin:
     case Intrinsic::experimental_vector_reduce_umax:
     case Intrinsic::experimental_vector_reduce_umin:
     case Intrinsic::experimental_vector_reduce_fmax:
     case Intrinsic::experimental_vector_reduce_fmin:
       Vec = II->getArgOperand(0);
       MRK = getMRK(ID);
       break;
     default:
       continue;
     }
     if (!TTI->shouldExpandReduction(II))
       continue;
     Value *Rdx =
         IsOrdered ? getOrderedReduction(Builder, Acc, Vec, getOpcode(ID), MRK)
                   : getShuffleReduction(Builder, Vec, getOpcode(ID), MRK);
     II->replaceAllUsesWith(Rdx);
     II->eraseFromParent();
     Changed = true;
   }
   return Changed;
 }

 class ExpandReductions : public FunctionPass {
 public:
   static char ID;
   ExpandReductions() : FunctionPass(ID) {
     initializeExpandReductionsPass(*PassRegistry::getPassRegistry());
   }

   bool runOnFunction(Function &F) override {
     const auto *TTI =&getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
     return expandReductions(F, TTI);
   }

   void getAnalysisUsage(AnalysisUsage &AU) const override {
     AU.addRequired<TargetTransformInfoWrapperPass>();
     AU.setPreservesCFG();
   }
 };
 }

 char ExpandReductions::ID;
 INITIALIZE_PASS_BEGIN(ExpandReductions, "expand-reductions",
                       "Expand reduction intrinsics", false, false)
 INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
 INITIALIZE_PASS_END(ExpandReductions, "expand-reductions",
                     "Expand reduction intrinsics", false, false)

 FunctionPass *llvm::createExpandReductionsPass() {
   return new ExpandReductions();
 }

 PreservedAnalyses ExpandReductionsPass::run(Function &F,
                                             FunctionAnalysisManager &AM) {
   const auto &TTI = AM.getResult<TargetIRAnalysis>(F);
   if (!expandReductions(F, &TTI))
     return PreservedAnalyses::all();
   PreservedAnalyses PA;
   PA.preserveSet<CFGAnalyses>();
   return PA;
 }
	//===--- ExpandReductions.cpp - Expand experimental reduction intrinsics --===//
	//
	// The LLVM Compiler Infrastructure
	//
	// This file is distributed under the University of Illinois Open Source
	// License. See LICENSE.TXT for details.
	//
	//===----------------------------------------------------------------------===//
	//
	// This pass implements IR expansion for reduction intrinsics, allowing targets
	// to enable the experimental intrinsics until just before codegen.
	//
	//===----------------------------------------------------------------------===//

	#include "llvm/CodeGen/ExpandReductions.h"
	#include "llvm/Analysis/TargetTransformInfo.h"
	#include "llvm/CodeGen/Passes.h"
	#include "llvm/IR/Function.h"
	#include "llvm/IR/IRBuilder.h"
	#include "llvm/IR/InstIterator.h"
	#include "llvm/IR/IntrinsicInst.h"
	#include "llvm/IR/Intrinsics.h"
	#include "llvm/IR/Module.h"
	#include "llvm/Pass.h"
	#include "llvm/Transforms/Utils/LoopUtils.h"

	using namespace llvm;

	namespace {

	unsigned getOpcode(Intrinsic::ID ID) {
	switch (ID) {
	case Intrinsic::experimental_vector_reduce_fadd:
	return Instruction::FAdd;
	case Intrinsic::experimental_vector_reduce_fmul:
	return Instruction::FMul;
	case Intrinsic::experimental_vector_reduce_add:
	return Instruction::Add;
	case Intrinsic::experimental_vector_reduce_mul:
	return Instruction::Mul;
	case Intrinsic::experimental_vector_reduce_and:
	return Instruction::And;
	case Intrinsic::experimental_vector_reduce_or:
	return Instruction::Or;
	case Intrinsic::experimental_vector_reduce_xor:
	return Instruction::Xor;
	case Intrinsic::experimental_vector_reduce_smax:
	case Intrinsic::experimental_vector_reduce_smin:
	case Intrinsic::experimental_vector_reduce_umax:
	case Intrinsic::experimental_vector_reduce_umin:
	return Instruction::ICmp;
	case Intrinsic::experimental_vector_reduce_fmax:
	case Intrinsic::experimental_vector_reduce_fmin:
	return Instruction::FCmp;
	default:
	llvm_unreachable("Unexpected ID");
	}
	}

	RecurrenceDescriptor::MinMaxRecurrenceKind getMRK(Intrinsic::ID ID) {
	switch (ID) {
	case Intrinsic::experimental_vector_reduce_smax:
	return RecurrenceDescriptor::MRK_SIntMax;
	case Intrinsic::experimental_vector_reduce_smin:
	return RecurrenceDescriptor::MRK_SIntMin;
	case Intrinsic::experimental_vector_reduce_umax:
	return RecurrenceDescriptor::MRK_UIntMax;
	case Intrinsic::experimental_vector_reduce_umin:
	return RecurrenceDescriptor::MRK_UIntMin;
	case Intrinsic::experimental_vector_reduce_fmax:
	return RecurrenceDescriptor::MRK_FloatMax;
	case Intrinsic::experimental_vector_reduce_fmin:
	return RecurrenceDescriptor::MRK_FloatMin;
	default:
	return RecurrenceDescriptor::MRK_Invalid;
	}
	}

	bool expandReductions(Function &F, const TargetTransformInfo *TTI) {
	bool Changed = false;
	SmallVector<IntrinsicInst *, 4> Worklist;
	for (inst_iterator I = inst_begin(F), E = inst_end(F); I != E; ++I)
	if (auto II = dyn_cast<IntrinsicInst>(&*I))
	Worklist.push_back(II);

	for (auto *II : Worklist) {
	IRBuilder<> Builder(II);
	bool IsOrdered = false;
	Value *Acc = nullptr;
	Value *Vec = nullptr;
	auto ID = II->getIntrinsicID();
	auto MRK = RecurrenceDescriptor::MRK_Invalid;
	switch (ID) {
	case Intrinsic::experimental_vector_reduce_fadd:
	case Intrinsic::experimental_vector_reduce_fmul:
	// FMFs must be attached to the call, otherwise it's an ordered reduction
	// and it can't be handled by generating a shuffle sequence.
	if (!II->getFastMathFlags().isFast())
	IsOrdered = true;
	Acc = II->getArgOperand(0);
	Vec = II->getArgOperand(1);
	break;
	case Intrinsic::experimental_vector_reduce_add:
	case Intrinsic::experimental_vector_reduce_mul:
	case Intrinsic::experimental_vector_reduce_and:
	case Intrinsic::experimental_vector_reduce_or:
	case Intrinsic::experimental_vector_reduce_xor:
	case Intrinsic::experimental_vector_reduce_smax:
	case Intrinsic::experimental_vector_reduce_smin:
	case Intrinsic::experimental_vector_reduce_umax:
	case Intrinsic::experimental_vector_reduce_umin:
	case Intrinsic::experimental_vector_reduce_fmax:
	case Intrinsic::experimental_vector_reduce_fmin:
	Vec = II->getArgOperand(0);
	MRK = getMRK(ID);
	break;
	default:
	continue;
	}
	if (!TTI->shouldExpandReduction(II))
	continue;
	Value *Rdx =
	IsOrdered ? getOrderedReduction(Builder, Acc, Vec, getOpcode(ID), MRK)
	: getShuffleReduction(Builder, Vec, getOpcode(ID), MRK);
	II->replaceAllUsesWith(Rdx);
	II->eraseFromParent();
	Changed = true;
	}
	return Changed;
	}

	class ExpandReductions : public FunctionPass {
	public:
	static char ID;
	ExpandReductions() : FunctionPass(ID) {
	initializeExpandReductionsPass(*PassRegistry::getPassRegistry());
	}

	bool runOnFunction(Function &F) override {
	const auto *TTI =&getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
	return expandReductions(F, TTI);
	}

	void getAnalysisUsage(AnalysisUsage &AU) const override {
	AU.addRequired<TargetTransformInfoWrapperPass>();
	AU.setPreservesCFG();
	}
	};
	}

	char ExpandReductions::ID;
	INITIALIZE_PASS_BEGIN(ExpandReductions, "expand-reductions",
	"Expand reduction intrinsics", false, false)
	INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
	INITIALIZE_PASS_END(ExpandReductions, "expand-reductions",
	"Expand reduction intrinsics", false, false)

	FunctionPass *llvm::createExpandReductionsPass() {
	return new ExpandReductions();
	}

	PreservedAnalyses ExpandReductionsPass::run(Function &F,
	FunctionAnalysisManager &AM) {
	const auto &TTI = AM.getResult<TargetIRAnalysis>(F);
	if (!expandReductions(F, &TTI))
	return PreservedAnalyses::all();
	PreservedAnalyses PA;
	PA.preserveSet<CFGAnalyses>();
	return PA;
	}