//===- PPCBoolRetToInt.cpp ------------------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file implements converting i1 values to i32/i64 if they could be more // profitably allocated as GPRs rather than CRs. This pass will become totally // unnecessary if Register Bank Allocation and Global Instruction Selection ever // go upstream. // // Presently, the pass converts i1 Constants, and Arguments to i32/i64 if the // transitive closure of their uses includes only PHINodes, CallInsts, and // ReturnInsts. The rational is that arguments are generally passed and returned // in GPRs rather than CRs, so casting them to i32/i64 at the LLVM IR level will // actually save casts at the Machine Instruction level. // // It might be useful to expand this pass to add bit-wise operations to the list // of safe transitive closure types. Also, we miss some opportunities when LLVM // represents logical AND and OR operations with control flow rather than data // flow. For example by lowering the expression: return (A && B && C) // // as: return A ? true : B && C. // // There's code in SimplifyCFG that code be used to turn control flow in data // flow using SelectInsts. Selects are slow on some architectures (P7/P8), so // this probably isn't good in general, but for the special case of i1, the // Selects could be further lowered to bit operations that are fast everywhere. // //===----------------------------------------------------------------------===// #include "PPC.h" #include "PPCTargetMachine.h" #include "llvm/ADT/DenseMap.h" #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/SmallPtrSet.h" #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/Statistic.h" #include "llvm/IR/Argument.h" #include "llvm/IR/Constants.h" #include "llvm/IR/Dominators.h" #include "llvm/IR/Function.h" #include "llvm/IR/Instruction.h" #include "llvm/IR/Instructions.h" #include "llvm/IR/IntrinsicInst.h" #include "llvm/IR/OperandTraits.h" #include "llvm/IR/Type.h" #include "llvm/IR/Use.h" #include "llvm/IR/User.h" #include "llvm/IR/Value.h" #include "llvm/Pass.h" #include "llvm/CodeGen/TargetPassConfig.h" #include "llvm/Support/Casting.h" #include using namespace llvm; namespace { #define DEBUG_TYPE "ppc-bool-ret-to-int" STATISTIC(NumBoolRetPromotion, "Number of times a bool feeding a RetInst was promoted to an int"); STATISTIC(NumBoolCallPromotion, "Number of times a bool feeding a CallInst was promoted to an int"); STATISTIC(NumBoolToIntPromotion, "Total number of times a bool was promoted to an int"); class PPCBoolRetToInt : public FunctionPass { static SmallPtrSet findAllDefs(Value *V) { SmallPtrSet Defs; SmallVector WorkList; WorkList.push_back(V); Defs.insert(V); while (!WorkList.empty()) { Value *Curr = WorkList.pop_back_val(); auto *CurrUser = dyn_cast(Curr); // Operands of CallInst/Constant are skipped because they may not be Bool // type. For CallInst, their positions are defined by ABI. if (CurrUser && !isa(Curr) && !isa(Curr)) for (auto &Op : CurrUser->operands()) if (Defs.insert(Op).second) WorkList.push_back(Op); } return Defs; } // Translate a i1 value to an equivalent i32/i64 value: Value *translate(Value *V) { assert(V->getType() == Type::getInt1Ty(V->getContext()) && "Expect an i1 value"); Type *IntTy = ST->isPPC64() ? Type::getInt64Ty(V->getContext()) : Type::getInt32Ty(V->getContext()); if (auto *C = dyn_cast(V)) return ConstantExpr::getZExt(C, IntTy); if (auto *P = dyn_cast(V)) { // Temporarily set the operands to 0. We'll fix this later in // runOnUse. Value *Zero = Constant::getNullValue(IntTy); PHINode *Q = PHINode::Create(IntTy, P->getNumIncomingValues(), P->getName(), P); for (unsigned i = 0; i < P->getNumOperands(); ++i) Q->addIncoming(Zero, P->getIncomingBlock(i)); return Q; } auto *A = dyn_cast(V); auto *I = dyn_cast(V); assert((A || I) && "Unknown value type"); auto InstPt = A ? &*A->getParent()->getEntryBlock().begin() : I->getNextNode(); return new ZExtInst(V, IntTy, "", InstPt); } typedef SmallPtrSet PHINodeSet; // A PHINode is Promotable if: // 1. Its type is i1 AND // 2. All of its uses are ReturnInt, CallInst, PHINode, or DbgInfoIntrinsic // AND // 3. All of its operands are Constant or Argument or // CallInst or PHINode AND // 4. All of its PHINode uses are Promotable AND // 5. All of its PHINode operands are Promotable static PHINodeSet getPromotablePHINodes(const Function &F) { PHINodeSet Promotable; // Condition 1 for (auto &BB : F) for (auto &I : BB) if (const auto *P = dyn_cast(&I)) if (P->getType()->isIntegerTy(1)) Promotable.insert(P); SmallVector ToRemove; for (const PHINode *P : Promotable) { // Condition 2 and 3 auto IsValidUser = [] (const Value *V) -> bool { return isa(V) || isa(V) || isa(V) || isa(V); }; auto IsValidOperand = [] (const Value *V) -> bool { return isa(V) || isa(V) || isa(V) || isa(V); }; const auto &Users = P->users(); const auto &Operands = P->operands(); if (!llvm::all_of(Users, IsValidUser) || !llvm::all_of(Operands, IsValidOperand)) ToRemove.push_back(P); } // Iterate to convergence auto IsPromotable = [&Promotable] (const Value *V) -> bool { const auto *Phi = dyn_cast(V); return !Phi || Promotable.count(Phi); }; while (!ToRemove.empty()) { for (auto &User : ToRemove) Promotable.erase(User); ToRemove.clear(); for (const PHINode *P : Promotable) { // Condition 4 and 5 const auto &Users = P->users(); const auto &Operands = P->operands(); if (!llvm::all_of(Users, IsPromotable) || !llvm::all_of(Operands, IsPromotable)) ToRemove.push_back(P); } } return Promotable; } typedef DenseMap B2IMap; public: static char ID; PPCBoolRetToInt() : FunctionPass(ID) { initializePPCBoolRetToIntPass(*PassRegistry::getPassRegistry()); } bool runOnFunction(Function &F) override { if (skipFunction(F)) return false; auto *TPC = getAnalysisIfAvailable(); if (!TPC) return false; auto &TM = TPC->getTM(); ST = TM.getSubtargetImpl(F); PHINodeSet PromotablePHINodes = getPromotablePHINodes(F); B2IMap Bool2IntMap; bool Changed = false; for (auto &BB : F) { for (auto &I : BB) { if (auto *R = dyn_cast(&I)) if (F.getReturnType()->isIntegerTy(1)) Changed |= runOnUse(R->getOperandUse(0), PromotablePHINodes, Bool2IntMap); if (auto *CI = dyn_cast(&I)) for (auto &U : CI->operands()) if (U->getType()->isIntegerTy(1)) Changed |= runOnUse(U, PromotablePHINodes, Bool2IntMap); } } return Changed; } bool runOnUse(Use &U, const PHINodeSet &PromotablePHINodes, B2IMap &BoolToIntMap) { auto Defs = findAllDefs(U); // If the values are all Constants or Arguments, don't bother if (llvm::none_of(Defs, [](Value *V) { return isa(V); })) return false; // Presently, we only know how to handle PHINode, Constant, Arguments and // CallInst. Potentially, bitwise operations (AND, OR, XOR, NOT) and sign // extension could also be handled in the future. for (Value *V : Defs) if (!isa(V) && !isa(V) && !isa(V) && !isa(V)) return false; for (Value *V : Defs) if (const auto *P = dyn_cast(V)) if (!PromotablePHINodes.count(P)) return false; if (isa(U.getUser())) ++NumBoolRetPromotion; if (isa(U.getUser())) ++NumBoolCallPromotion; ++NumBoolToIntPromotion; for (Value *V : Defs) if (!BoolToIntMap.count(V)) BoolToIntMap[V] = translate(V); // Replace the operands of the translated instructions. They were set to // zero in the translate function. for (auto &Pair : BoolToIntMap) { auto *First = dyn_cast(Pair.first); auto *Second = dyn_cast(Pair.second); assert((!First || Second) && "translated from user to non-user!?"); // Operands of CallInst/Constant are skipped because they may not be Bool // type. For CallInst, their positions are defined by ABI. if (First && !isa(First) && !isa(First)) for (unsigned i = 0; i < First->getNumOperands(); ++i) Second->setOperand(i, BoolToIntMap[First->getOperand(i)]); } Value *IntRetVal = BoolToIntMap[U]; Type *Int1Ty = Type::getInt1Ty(U->getContext()); auto *I = cast(U.getUser()); Value *BackToBool = new TruncInst(IntRetVal, Int1Ty, "backToBool", I); U.set(BackToBool); return true; } void getAnalysisUsage(AnalysisUsage &AU) const override { AU.addPreserved(); FunctionPass::getAnalysisUsage(AU); } private: const PPCSubtarget *ST; }; } // end anonymous namespace char PPCBoolRetToInt::ID = 0; INITIALIZE_PASS(PPCBoolRetToInt, "ppc-bool-ret-to-int", "Convert i1 constants to i32/i64 if they are returned", false, false) FunctionPass *llvm::createPPCBoolRetToIntPass() { return new PPCBoolRetToInt(); }