You've already forked linux-packaging-mono
							
							
		
			
	
	
		
			168 lines
		
	
	
		
			5.8 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
		
		
			
		
	
	
			168 lines
		
	
	
		
			5.8 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
|   | //===--- ExpandReductions.cpp - Expand experimental reduction intrinsics --===//
 | ||
|  | //
 | ||
|  | //                     The LLVM Compiler Infrastructure
 | ||
|  | //
 | ||
|  | // This file is distributed under the University of Illinois Open Source
 | ||
|  | // License. See LICENSE.TXT for details.
 | ||
|  | //
 | ||
|  | //===----------------------------------------------------------------------===//
 | ||
|  | //
 | ||
|  | // This pass implements IR expansion for reduction intrinsics, allowing targets
 | ||
|  | // to enable the experimental intrinsics until just before codegen.
 | ||
|  | //
 | ||
|  | //===----------------------------------------------------------------------===//
 | ||
|  | 
 | ||
|  | #include "llvm/CodeGen/ExpandReductions.h"
 | ||
|  | #include "llvm/Analysis/TargetTransformInfo.h"
 | ||
|  | #include "llvm/CodeGen/Passes.h"
 | ||
|  | #include "llvm/IR/Function.h"
 | ||
|  | #include "llvm/IR/IRBuilder.h"
 | ||
|  | #include "llvm/IR/InstIterator.h"
 | ||
|  | #include "llvm/IR/IntrinsicInst.h"
 | ||
|  | #include "llvm/IR/Intrinsics.h"
 | ||
|  | #include "llvm/IR/Module.h"
 | ||
|  | #include "llvm/Pass.h"
 | ||
|  | #include "llvm/Transforms/Utils/LoopUtils.h"
 | ||
|  | 
 | ||
|  | using namespace llvm; | ||
|  | 
 | ||
|  | namespace { | ||
|  | 
 | ||
|  | unsigned getOpcode(Intrinsic::ID ID) { | ||
|  |   switch (ID) { | ||
|  |   case Intrinsic::experimental_vector_reduce_fadd: | ||
|  |     return Instruction::FAdd; | ||
|  |   case Intrinsic::experimental_vector_reduce_fmul: | ||
|  |     return Instruction::FMul; | ||
|  |   case Intrinsic::experimental_vector_reduce_add: | ||
|  |     return Instruction::Add; | ||
|  |   case Intrinsic::experimental_vector_reduce_mul: | ||
|  |     return Instruction::Mul; | ||
|  |   case Intrinsic::experimental_vector_reduce_and: | ||
|  |     return Instruction::And; | ||
|  |   case Intrinsic::experimental_vector_reduce_or: | ||
|  |     return Instruction::Or; | ||
|  |   case Intrinsic::experimental_vector_reduce_xor: | ||
|  |     return Instruction::Xor; | ||
|  |   case Intrinsic::experimental_vector_reduce_smax: | ||
|  |   case Intrinsic::experimental_vector_reduce_smin: | ||
|  |   case Intrinsic::experimental_vector_reduce_umax: | ||
|  |   case Intrinsic::experimental_vector_reduce_umin: | ||
|  |     return Instruction::ICmp; | ||
|  |   case Intrinsic::experimental_vector_reduce_fmax: | ||
|  |   case Intrinsic::experimental_vector_reduce_fmin: | ||
|  |     return Instruction::FCmp; | ||
|  |   default: | ||
|  |     llvm_unreachable("Unexpected ID"); | ||
|  |   } | ||
|  | } | ||
|  | 
 | ||
|  | RecurrenceDescriptor::MinMaxRecurrenceKind getMRK(Intrinsic::ID ID) { | ||
|  |   switch (ID) { | ||
|  |   case Intrinsic::experimental_vector_reduce_smax: | ||
|  |     return RecurrenceDescriptor::MRK_SIntMax; | ||
|  |   case Intrinsic::experimental_vector_reduce_smin: | ||
|  |     return RecurrenceDescriptor::MRK_SIntMin; | ||
|  |   case Intrinsic::experimental_vector_reduce_umax: | ||
|  |     return RecurrenceDescriptor::MRK_UIntMax; | ||
|  |   case Intrinsic::experimental_vector_reduce_umin: | ||
|  |     return RecurrenceDescriptor::MRK_UIntMin; | ||
|  |   case Intrinsic::experimental_vector_reduce_fmax: | ||
|  |     return RecurrenceDescriptor::MRK_FloatMax; | ||
|  |   case Intrinsic::experimental_vector_reduce_fmin: | ||
|  |     return RecurrenceDescriptor::MRK_FloatMin; | ||
|  |   default: | ||
|  |     return RecurrenceDescriptor::MRK_Invalid; | ||
|  |   } | ||
|  | } | ||
|  | 
 | ||
|  | bool expandReductions(Function &F, const TargetTransformInfo *TTI) { | ||
|  |   bool Changed = false; | ||
|  |   SmallVector<IntrinsicInst*, 4> Worklist; | ||
|  |   for (inst_iterator I = inst_begin(F), E = inst_end(F); I != E; ++I) | ||
|  |     if (auto II = dyn_cast<IntrinsicInst>(&*I)) | ||
|  |       Worklist.push_back(II); | ||
|  | 
 | ||
|  |   for (auto *II : Worklist) { | ||
|  |     IRBuilder<> Builder(II); | ||
|  |     Value *Vec = nullptr; | ||
|  |     auto ID = II->getIntrinsicID(); | ||
|  |     auto MRK = RecurrenceDescriptor::MRK_Invalid; | ||
|  |     switch (ID) { | ||
|  |     case Intrinsic::experimental_vector_reduce_fadd: | ||
|  |     case Intrinsic::experimental_vector_reduce_fmul: | ||
|  |       // FMFs must be attached to the call, otherwise it's an ordered reduction
 | ||
|  |       // and it can't be handled by generating this shuffle sequence.
 | ||
|  |       // TODO: Implement scalarization of ordered reductions here for targets
 | ||
|  |       // without native support.
 | ||
|  |       if (!II->getFastMathFlags().isFast()) | ||
|  |         continue; | ||
|  |       Vec = II->getArgOperand(1); | ||
|  |       break; | ||
|  |     case Intrinsic::experimental_vector_reduce_add: | ||
|  |     case Intrinsic::experimental_vector_reduce_mul: | ||
|  |     case Intrinsic::experimental_vector_reduce_and: | ||
|  |     case Intrinsic::experimental_vector_reduce_or: | ||
|  |     case Intrinsic::experimental_vector_reduce_xor: | ||
|  |     case Intrinsic::experimental_vector_reduce_smax: | ||
|  |     case Intrinsic::experimental_vector_reduce_smin: | ||
|  |     case Intrinsic::experimental_vector_reduce_umax: | ||
|  |     case Intrinsic::experimental_vector_reduce_umin: | ||
|  |     case Intrinsic::experimental_vector_reduce_fmax: | ||
|  |     case Intrinsic::experimental_vector_reduce_fmin: | ||
|  |       Vec = II->getArgOperand(0); | ||
|  |       MRK = getMRK(ID); | ||
|  |       break; | ||
|  |     default: | ||
|  |       continue; | ||
|  |     } | ||
|  |     if (!TTI->shouldExpandReduction(II)) | ||
|  |       continue; | ||
|  |     auto Rdx = getShuffleReduction(Builder, Vec, getOpcode(ID), MRK); | ||
|  |     II->replaceAllUsesWith(Rdx); | ||
|  |     II->eraseFromParent(); | ||
|  |     Changed = true; | ||
|  |   } | ||
|  |   return Changed; | ||
|  | } | ||
|  | 
 | ||
|  | class ExpandReductions : public FunctionPass { | ||
|  | public: | ||
|  |   static char ID; | ||
|  |   ExpandReductions() : FunctionPass(ID) { | ||
|  |     initializeExpandReductionsPass(*PassRegistry::getPassRegistry()); | ||
|  |   } | ||
|  | 
 | ||
|  |   bool runOnFunction(Function &F) override { | ||
|  |     const auto *TTI =&getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F); | ||
|  |     return expandReductions(F, TTI); | ||
|  |   } | ||
|  | 
 | ||
|  |   void getAnalysisUsage(AnalysisUsage &AU) const override { | ||
|  |     AU.addRequired<TargetTransformInfoWrapperPass>(); | ||
|  |     AU.setPreservesCFG(); | ||
|  |   } | ||
|  | }; | ||
|  | } | ||
|  | 
 | ||
|  | char ExpandReductions::ID; | ||
|  | INITIALIZE_PASS_BEGIN(ExpandReductions, "expand-reductions", | ||
|  |                       "Expand reduction intrinsics", false, false) | ||
|  | INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass) | ||
|  | INITIALIZE_PASS_END(ExpandReductions, "expand-reductions", | ||
|  |                     "Expand reduction intrinsics", false, false) | ||
|  | 
 | ||
|  | FunctionPass *llvm::createExpandReductionsPass() { | ||
|  |   return new ExpandReductions(); | ||
|  | } | ||
|  | 
 | ||
|  | PreservedAnalyses ExpandReductionsPass::run(Function &F, | ||
|  |                                             FunctionAnalysisManager &AM) { | ||
|  |   const auto &TTI = AM.getResult<TargetIRAnalysis>(F); | ||
|  |   if (!expandReductions(F, &TTI)) | ||
|  |     return PreservedAnalyses::all(); | ||
|  |   PreservedAnalyses PA; | ||
|  |   PA.preserveSet<CFGAnalyses>(); | ||
|  |   return PA; | ||
|  | } |