xref: /aosp_15_r20/external/llvm/lib/Target/NVPTX/NVPTXFavorNonGenericAddrSpaces.cpp (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker //===-- NVPTXFavorNonGenericAddrSpace.cpp - ---------------------*- C++ -*-===//
2*9880d681SAndroid Build Coastguard Worker //
3*9880d681SAndroid Build Coastguard Worker //                     The LLVM Compiler Infrastructure
4*9880d681SAndroid Build Coastguard Worker //
5*9880d681SAndroid Build Coastguard Worker // This file is distributed under the University of Illinois Open Source
6*9880d681SAndroid Build Coastguard Worker // License. See LICENSE.TXT for details.
7*9880d681SAndroid Build Coastguard Worker //
8*9880d681SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
9*9880d681SAndroid Build Coastguard Worker //
10*9880d681SAndroid Build Coastguard Worker // FIXME: This pass is deprecated in favor of NVPTXInferAddressSpaces, which
11*9880d681SAndroid Build Coastguard Worker // uses a new algorithm that handles pointer induction variables.
12*9880d681SAndroid Build Coastguard Worker //
13*9880d681SAndroid Build Coastguard Worker // When a load/store accesses the generic address space, checks whether the
14*9880d681SAndroid Build Coastguard Worker // address is casted from a non-generic address space. If so, remove this
15*9880d681SAndroid Build Coastguard Worker // addrspacecast because accessing non-generic address spaces is typically
16*9880d681SAndroid Build Coastguard Worker // faster. Besides removing addrspacecasts directly used by loads/stores, this
17*9880d681SAndroid Build Coastguard Worker // optimization also recursively traces into a GEP's pointer operand and a
18*9880d681SAndroid Build Coastguard Worker // bitcast's source to find more eliminable addrspacecasts.
19*9880d681SAndroid Build Coastguard Worker //
20*9880d681SAndroid Build Coastguard Worker // For instance, the code below loads a float from an array allocated in
21*9880d681SAndroid Build Coastguard Worker // addrspace(3).
22*9880d681SAndroid Build Coastguard Worker //
23*9880d681SAndroid Build Coastguard Worker //   %0 = addrspacecast [10 x float] addrspace(3)* @a to [10 x float]*
24*9880d681SAndroid Build Coastguard Worker //   %1 = gep [10 x float]* %0, i64 0, i64 %i
25*9880d681SAndroid Build Coastguard Worker //   %2 = bitcast float* %1 to i32*
26*9880d681SAndroid Build Coastguard Worker //   %3 = load i32* %2 ; emits ld.u32
27*9880d681SAndroid Build Coastguard Worker //
28*9880d681SAndroid Build Coastguard Worker // First, function hoistAddrSpaceCastFrom reorders the addrspacecast, the GEP,
29*9880d681SAndroid Build Coastguard Worker // and the bitcast to expose more optimization opportunities to function
30*9880d681SAndroid Build Coastguard Worker // optimizeMemoryInst. The intermediate code looks like:
31*9880d681SAndroid Build Coastguard Worker //
32*9880d681SAndroid Build Coastguard Worker //   %0 = gep [10 x float] addrspace(3)* @a, i64 0, i64 %i
33*9880d681SAndroid Build Coastguard Worker //   %1 = bitcast float addrspace(3)* %0 to i32 addrspace(3)*
34*9880d681SAndroid Build Coastguard Worker //   %2 = addrspacecast i32 addrspace(3)* %1 to i32*
35*9880d681SAndroid Build Coastguard Worker //   %3 = load i32* %2 ; still emits ld.u32, but will be optimized shortly
36*9880d681SAndroid Build Coastguard Worker //
37*9880d681SAndroid Build Coastguard Worker // Then, function optimizeMemoryInstruction detects a load from addrspacecast'ed
38*9880d681SAndroid Build Coastguard Worker // generic pointers, and folds the load and the addrspacecast into a load from
39*9880d681SAndroid Build Coastguard Worker // the original address space. The final code looks like:
40*9880d681SAndroid Build Coastguard Worker //
41*9880d681SAndroid Build Coastguard Worker //   %0 = gep [10 x float] addrspace(3)* @a, i64 0, i64 %i
42*9880d681SAndroid Build Coastguard Worker //   %1 = bitcast float addrspace(3)* %0 to i32 addrspace(3)*
43*9880d681SAndroid Build Coastguard Worker //   %3 = load i32 addrspace(3)* %1 ; emits ld.shared.f32
44*9880d681SAndroid Build Coastguard Worker //
45*9880d681SAndroid Build Coastguard Worker // This pass may remove an addrspacecast in a different BB. Therefore, we
46*9880d681SAndroid Build Coastguard Worker // implement it as a FunctionPass.
47*9880d681SAndroid Build Coastguard Worker //
48*9880d681SAndroid Build Coastguard Worker // TODO:
49*9880d681SAndroid Build Coastguard Worker // The current implementation doesn't handle PHINodes. Eliminating
50*9880d681SAndroid Build Coastguard Worker // addrspacecasts used by PHINodes is trickier because PHINodes can introduce
51*9880d681SAndroid Build Coastguard Worker // loops in data flow. For example,
52*9880d681SAndroid Build Coastguard Worker //
53*9880d681SAndroid Build Coastguard Worker //     %generic.input = addrspacecast float addrspace(3)* %input to float*
54*9880d681SAndroid Build Coastguard Worker //   loop:
55*9880d681SAndroid Build Coastguard Worker //     %y = phi [ %generic.input, %y2 ]
56*9880d681SAndroid Build Coastguard Worker //     %y2 = getelementptr %y, 1
57*9880d681SAndroid Build Coastguard Worker //     %v = load %y2
58*9880d681SAndroid Build Coastguard Worker //     br ..., label %loop, ...
59*9880d681SAndroid Build Coastguard Worker //
60*9880d681SAndroid Build Coastguard Worker // Marking %y2 shared depends on marking %y shared, but %y also data-flow
61*9880d681SAndroid Build Coastguard Worker // depends on %y2. We probably need an iterative fix-point algorithm on handle
62*9880d681SAndroid Build Coastguard Worker // this case.
63*9880d681SAndroid Build Coastguard Worker //
64*9880d681SAndroid Build Coastguard Worker //===----------------------------------------------------------------------===//
65*9880d681SAndroid Build Coastguard Worker 
66*9880d681SAndroid Build Coastguard Worker #include "NVPTX.h"
67*9880d681SAndroid Build Coastguard Worker #include "llvm/IR/Function.h"
68*9880d681SAndroid Build Coastguard Worker #include "llvm/IR/Instructions.h"
69*9880d681SAndroid Build Coastguard Worker #include "llvm/IR/Operator.h"
70*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/CommandLine.h"
71*9880d681SAndroid Build Coastguard Worker 
72*9880d681SAndroid Build Coastguard Worker using namespace llvm;
73*9880d681SAndroid Build Coastguard Worker 
74*9880d681SAndroid Build Coastguard Worker // An option to disable this optimization. Enable it by default.
75*9880d681SAndroid Build Coastguard Worker static cl::opt<bool> DisableFavorNonGeneric(
76*9880d681SAndroid Build Coastguard Worker   "disable-nvptx-favor-non-generic",
77*9880d681SAndroid Build Coastguard Worker   cl::init(false),
78*9880d681SAndroid Build Coastguard Worker   cl::desc("Do not convert generic address space usage "
79*9880d681SAndroid Build Coastguard Worker            "to non-generic address space usage"),
80*9880d681SAndroid Build Coastguard Worker   cl::Hidden);
81*9880d681SAndroid Build Coastguard Worker 
82*9880d681SAndroid Build Coastguard Worker namespace {
83*9880d681SAndroid Build Coastguard Worker /// \brief NVPTXFavorNonGenericAddrSpaces
84*9880d681SAndroid Build Coastguard Worker class NVPTXFavorNonGenericAddrSpaces : public FunctionPass {
85*9880d681SAndroid Build Coastguard Worker public:
86*9880d681SAndroid Build Coastguard Worker   static char ID;
NVPTXFavorNonGenericAddrSpaces()87*9880d681SAndroid Build Coastguard Worker   NVPTXFavorNonGenericAddrSpaces() : FunctionPass(ID) {}
88*9880d681SAndroid Build Coastguard Worker   bool runOnFunction(Function &F) override;
89*9880d681SAndroid Build Coastguard Worker 
90*9880d681SAndroid Build Coastguard Worker private:
91*9880d681SAndroid Build Coastguard Worker   /// Optimizes load/store instructions. Idx is the index of the pointer operand
92*9880d681SAndroid Build Coastguard Worker   /// (0 for load, and 1 for store). Returns true if it changes anything.
93*9880d681SAndroid Build Coastguard Worker   bool optimizeMemoryInstruction(Instruction *I, unsigned Idx);
94*9880d681SAndroid Build Coastguard Worker   /// Recursively traces into a GEP's pointer operand or a bitcast's source to
95*9880d681SAndroid Build Coastguard Worker   /// find an eliminable addrspacecast, and hoists that addrspacecast to the
96*9880d681SAndroid Build Coastguard Worker   /// outermost level. For example, this function transforms
97*9880d681SAndroid Build Coastguard Worker   ///   bitcast(gep(gep(addrspacecast(X))))
98*9880d681SAndroid Build Coastguard Worker   /// to
99*9880d681SAndroid Build Coastguard Worker   ///   addrspacecast(bitcast(gep(gep(X)))).
100*9880d681SAndroid Build Coastguard Worker   ///
101*9880d681SAndroid Build Coastguard Worker   /// This reordering exposes to optimizeMemoryInstruction more
102*9880d681SAndroid Build Coastguard Worker   /// optimization opportunities on loads and stores.
103*9880d681SAndroid Build Coastguard Worker   ///
104*9880d681SAndroid Build Coastguard Worker   /// If this function successfully hoists an eliminable addrspacecast or V is
105*9880d681SAndroid Build Coastguard Worker   /// already such an addrspacecast, it returns the transformed value (which is
106*9880d681SAndroid Build Coastguard Worker   /// guaranteed to be an addrspacecast); otherwise, it returns nullptr.
107*9880d681SAndroid Build Coastguard Worker   Value *hoistAddrSpaceCastFrom(Value *V, int Depth = 0);
108*9880d681SAndroid Build Coastguard Worker   /// Helper function for GEPs.
109*9880d681SAndroid Build Coastguard Worker   Value *hoistAddrSpaceCastFromGEP(GEPOperator *GEP, int Depth);
110*9880d681SAndroid Build Coastguard Worker   /// Helper function for bitcasts.
111*9880d681SAndroid Build Coastguard Worker   Value *hoistAddrSpaceCastFromBitCast(BitCastOperator *BC, int Depth);
112*9880d681SAndroid Build Coastguard Worker };
113*9880d681SAndroid Build Coastguard Worker }
114*9880d681SAndroid Build Coastguard Worker 
115*9880d681SAndroid Build Coastguard Worker char NVPTXFavorNonGenericAddrSpaces::ID = 0;
116*9880d681SAndroid Build Coastguard Worker 
117*9880d681SAndroid Build Coastguard Worker namespace llvm {
118*9880d681SAndroid Build Coastguard Worker void initializeNVPTXFavorNonGenericAddrSpacesPass(PassRegistry &);
119*9880d681SAndroid Build Coastguard Worker }
120*9880d681SAndroid Build Coastguard Worker INITIALIZE_PASS(NVPTXFavorNonGenericAddrSpaces, "nvptx-favor-non-generic",
121*9880d681SAndroid Build Coastguard Worker                 "Remove unnecessary non-generic-to-generic addrspacecasts",
122*9880d681SAndroid Build Coastguard Worker                 false, false)
123*9880d681SAndroid Build Coastguard Worker 
124*9880d681SAndroid Build Coastguard Worker // Decides whether V is an addrspacecast and shortcutting V in load/store is
125*9880d681SAndroid Build Coastguard Worker // valid and beneficial.
isEliminableAddrSpaceCast(Value * V)126*9880d681SAndroid Build Coastguard Worker static bool isEliminableAddrSpaceCast(Value *V) {
127*9880d681SAndroid Build Coastguard Worker   // Returns false if V is not even an addrspacecast.
128*9880d681SAndroid Build Coastguard Worker   Operator *Cast = dyn_cast<Operator>(V);
129*9880d681SAndroid Build Coastguard Worker   if (Cast == nullptr || Cast->getOpcode() != Instruction::AddrSpaceCast)
130*9880d681SAndroid Build Coastguard Worker     return false;
131*9880d681SAndroid Build Coastguard Worker 
132*9880d681SAndroid Build Coastguard Worker   Value *Src = Cast->getOperand(0);
133*9880d681SAndroid Build Coastguard Worker   PointerType *SrcTy = cast<PointerType>(Src->getType());
134*9880d681SAndroid Build Coastguard Worker   PointerType *DestTy = cast<PointerType>(Cast->getType());
135*9880d681SAndroid Build Coastguard Worker   // TODO: For now, we only handle the case where the addrspacecast only changes
136*9880d681SAndroid Build Coastguard Worker   // the address space but not the type. If the type also changes, we could
137*9880d681SAndroid Build Coastguard Worker   // still get rid of the addrspacecast by adding an extra bitcast, but we
138*9880d681SAndroid Build Coastguard Worker   // rarely see such scenarios.
139*9880d681SAndroid Build Coastguard Worker   if (SrcTy->getElementType() != DestTy->getElementType())
140*9880d681SAndroid Build Coastguard Worker     return false;
141*9880d681SAndroid Build Coastguard Worker 
142*9880d681SAndroid Build Coastguard Worker   // Checks whether the addrspacecast is from a non-generic address space to the
143*9880d681SAndroid Build Coastguard Worker   // generic address space.
144*9880d681SAndroid Build Coastguard Worker   return (SrcTy->getAddressSpace() != AddressSpace::ADDRESS_SPACE_GENERIC &&
145*9880d681SAndroid Build Coastguard Worker           DestTy->getAddressSpace() == AddressSpace::ADDRESS_SPACE_GENERIC);
146*9880d681SAndroid Build Coastguard Worker }
147*9880d681SAndroid Build Coastguard Worker 
hoistAddrSpaceCastFromGEP(GEPOperator * GEP,int Depth)148*9880d681SAndroid Build Coastguard Worker Value *NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromGEP(
149*9880d681SAndroid Build Coastguard Worker     GEPOperator *GEP, int Depth) {
150*9880d681SAndroid Build Coastguard Worker   Value *NewOperand =
151*9880d681SAndroid Build Coastguard Worker       hoistAddrSpaceCastFrom(GEP->getPointerOperand(), Depth + 1);
152*9880d681SAndroid Build Coastguard Worker   if (NewOperand == nullptr)
153*9880d681SAndroid Build Coastguard Worker     return nullptr;
154*9880d681SAndroid Build Coastguard Worker 
155*9880d681SAndroid Build Coastguard Worker   // hoistAddrSpaceCastFrom returns an eliminable addrspacecast or nullptr.
156*9880d681SAndroid Build Coastguard Worker   assert(isEliminableAddrSpaceCast(NewOperand));
157*9880d681SAndroid Build Coastguard Worker   Operator *Cast = cast<Operator>(NewOperand);
158*9880d681SAndroid Build Coastguard Worker 
159*9880d681SAndroid Build Coastguard Worker   SmallVector<Value *, 8> Indices(GEP->idx_begin(), GEP->idx_end());
160*9880d681SAndroid Build Coastguard Worker   Value *NewASC;
161*9880d681SAndroid Build Coastguard Worker   if (Instruction *GEPI = dyn_cast<Instruction>(GEP)) {
162*9880d681SAndroid Build Coastguard Worker     // GEP = gep (addrspacecast X), indices
163*9880d681SAndroid Build Coastguard Worker     // =>
164*9880d681SAndroid Build Coastguard Worker     // NewGEP = gep X, indices
165*9880d681SAndroid Build Coastguard Worker     // NewASC = addrspacecast NewGEP
166*9880d681SAndroid Build Coastguard Worker     GetElementPtrInst *NewGEP = GetElementPtrInst::Create(
167*9880d681SAndroid Build Coastguard Worker         GEP->getSourceElementType(), Cast->getOperand(0), Indices,
168*9880d681SAndroid Build Coastguard Worker         "", GEPI);
169*9880d681SAndroid Build Coastguard Worker     NewGEP->setIsInBounds(GEP->isInBounds());
170*9880d681SAndroid Build Coastguard Worker     NewGEP->takeName(GEP);
171*9880d681SAndroid Build Coastguard Worker     NewASC = new AddrSpaceCastInst(NewGEP, GEP->getType(), "", GEPI);
172*9880d681SAndroid Build Coastguard Worker     // Without RAUWing GEP, the compiler would visit GEP again and emit
173*9880d681SAndroid Build Coastguard Worker     // redundant instructions. This is exercised in test @rauw in
174*9880d681SAndroid Build Coastguard Worker     // access-non-generic.ll.
175*9880d681SAndroid Build Coastguard Worker     GEP->replaceAllUsesWith(NewASC);
176*9880d681SAndroid Build Coastguard Worker   } else {
177*9880d681SAndroid Build Coastguard Worker     // GEP is a constant expression.
178*9880d681SAndroid Build Coastguard Worker     Constant *NewGEP = ConstantExpr::getGetElementPtr(
179*9880d681SAndroid Build Coastguard Worker         GEP->getSourceElementType(), cast<Constant>(Cast->getOperand(0)),
180*9880d681SAndroid Build Coastguard Worker         Indices, GEP->isInBounds());
181*9880d681SAndroid Build Coastguard Worker     NewASC = ConstantExpr::getAddrSpaceCast(NewGEP, GEP->getType());
182*9880d681SAndroid Build Coastguard Worker   }
183*9880d681SAndroid Build Coastguard Worker   return NewASC;
184*9880d681SAndroid Build Coastguard Worker }
185*9880d681SAndroid Build Coastguard Worker 
hoistAddrSpaceCastFromBitCast(BitCastOperator * BC,int Depth)186*9880d681SAndroid Build Coastguard Worker Value *NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromBitCast(
187*9880d681SAndroid Build Coastguard Worker     BitCastOperator *BC, int Depth) {
188*9880d681SAndroid Build Coastguard Worker   Value *NewOperand = hoistAddrSpaceCastFrom(BC->getOperand(0), Depth + 1);
189*9880d681SAndroid Build Coastguard Worker   if (NewOperand == nullptr)
190*9880d681SAndroid Build Coastguard Worker     return nullptr;
191*9880d681SAndroid Build Coastguard Worker 
192*9880d681SAndroid Build Coastguard Worker   // hoistAddrSpaceCastFrom returns an eliminable addrspacecast or nullptr.
193*9880d681SAndroid Build Coastguard Worker   assert(isEliminableAddrSpaceCast(NewOperand));
194*9880d681SAndroid Build Coastguard Worker   Operator *Cast = cast<Operator>(NewOperand);
195*9880d681SAndroid Build Coastguard Worker 
196*9880d681SAndroid Build Coastguard Worker   // Cast  = addrspacecast Src
197*9880d681SAndroid Build Coastguard Worker   // BC    = bitcast Cast
198*9880d681SAndroid Build Coastguard Worker   //   =>
199*9880d681SAndroid Build Coastguard Worker   // Cast' = bitcast Src
200*9880d681SAndroid Build Coastguard Worker   // BC'   = addrspacecast Cast'
201*9880d681SAndroid Build Coastguard Worker   Value *Src = Cast->getOperand(0);
202*9880d681SAndroid Build Coastguard Worker   Type *TypeOfNewCast =
203*9880d681SAndroid Build Coastguard Worker       PointerType::get(BC->getType()->getPointerElementType(),
204*9880d681SAndroid Build Coastguard Worker                        Src->getType()->getPointerAddressSpace());
205*9880d681SAndroid Build Coastguard Worker   Value *NewBC;
206*9880d681SAndroid Build Coastguard Worker   if (BitCastInst *BCI = dyn_cast<BitCastInst>(BC)) {
207*9880d681SAndroid Build Coastguard Worker     Value *NewCast = new BitCastInst(Src, TypeOfNewCast, "", BCI);
208*9880d681SAndroid Build Coastguard Worker     NewBC = new AddrSpaceCastInst(NewCast, BC->getType(), "", BCI);
209*9880d681SAndroid Build Coastguard Worker     NewBC->takeName(BC);
210*9880d681SAndroid Build Coastguard Worker     // Without RAUWing BC, the compiler would visit BC again and emit
211*9880d681SAndroid Build Coastguard Worker     // redundant instructions. This is exercised in test @rauw in
212*9880d681SAndroid Build Coastguard Worker     // access-non-generic.ll.
213*9880d681SAndroid Build Coastguard Worker     BC->replaceAllUsesWith(NewBC);
214*9880d681SAndroid Build Coastguard Worker   } else {
215*9880d681SAndroid Build Coastguard Worker     // BC is a constant expression.
216*9880d681SAndroid Build Coastguard Worker     Constant *NewCast =
217*9880d681SAndroid Build Coastguard Worker         ConstantExpr::getBitCast(cast<Constant>(Src), TypeOfNewCast);
218*9880d681SAndroid Build Coastguard Worker     NewBC = ConstantExpr::getAddrSpaceCast(NewCast, BC->getType());
219*9880d681SAndroid Build Coastguard Worker   }
220*9880d681SAndroid Build Coastguard Worker   return NewBC;
221*9880d681SAndroid Build Coastguard Worker }
222*9880d681SAndroid Build Coastguard Worker 
hoistAddrSpaceCastFrom(Value * V,int Depth)223*9880d681SAndroid Build Coastguard Worker Value *NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFrom(Value *V,
224*9880d681SAndroid Build Coastguard Worker                                                               int Depth) {
225*9880d681SAndroid Build Coastguard Worker   // Returns V if V is already an eliminable addrspacecast.
226*9880d681SAndroid Build Coastguard Worker   if (isEliminableAddrSpaceCast(V))
227*9880d681SAndroid Build Coastguard Worker     return V;
228*9880d681SAndroid Build Coastguard Worker 
229*9880d681SAndroid Build Coastguard Worker   // Limit the depth to prevent this recursive function from running too long.
230*9880d681SAndroid Build Coastguard Worker   const int MaxDepth = 20;
231*9880d681SAndroid Build Coastguard Worker   if (Depth >= MaxDepth)
232*9880d681SAndroid Build Coastguard Worker     return nullptr;
233*9880d681SAndroid Build Coastguard Worker 
234*9880d681SAndroid Build Coastguard Worker   // If V is a GEP or bitcast, hoist the addrspacecast if any from its pointer
235*9880d681SAndroid Build Coastguard Worker   // operand. This enables optimizeMemoryInstruction to shortcut addrspacecasts
236*9880d681SAndroid Build Coastguard Worker   // that are not directly used by the load/store.
237*9880d681SAndroid Build Coastguard Worker   if (GEPOperator *GEP = dyn_cast<GEPOperator>(V))
238*9880d681SAndroid Build Coastguard Worker     return hoistAddrSpaceCastFromGEP(GEP, Depth);
239*9880d681SAndroid Build Coastguard Worker 
240*9880d681SAndroid Build Coastguard Worker   if (BitCastOperator *BC = dyn_cast<BitCastOperator>(V))
241*9880d681SAndroid Build Coastguard Worker     return hoistAddrSpaceCastFromBitCast(BC, Depth);
242*9880d681SAndroid Build Coastguard Worker 
243*9880d681SAndroid Build Coastguard Worker   return nullptr;
244*9880d681SAndroid Build Coastguard Worker }
245*9880d681SAndroid Build Coastguard Worker 
optimizeMemoryInstruction(Instruction * MI,unsigned Idx)246*9880d681SAndroid Build Coastguard Worker bool NVPTXFavorNonGenericAddrSpaces::optimizeMemoryInstruction(Instruction *MI,
247*9880d681SAndroid Build Coastguard Worker                                                                unsigned Idx) {
248*9880d681SAndroid Build Coastguard Worker   Value *NewOperand = hoistAddrSpaceCastFrom(MI->getOperand(Idx));
249*9880d681SAndroid Build Coastguard Worker   if (NewOperand == nullptr)
250*9880d681SAndroid Build Coastguard Worker     return false;
251*9880d681SAndroid Build Coastguard Worker 
252*9880d681SAndroid Build Coastguard Worker   // load/store (addrspacecast X) => load/store X if shortcutting the
253*9880d681SAndroid Build Coastguard Worker   // addrspacecast is valid and can improve performance.
254*9880d681SAndroid Build Coastguard Worker   //
255*9880d681SAndroid Build Coastguard Worker   // e.g.,
256*9880d681SAndroid Build Coastguard Worker   // %1 = addrspacecast float addrspace(3)* %0 to float*
257*9880d681SAndroid Build Coastguard Worker   // %2 = load float* %1
258*9880d681SAndroid Build Coastguard Worker   // ->
259*9880d681SAndroid Build Coastguard Worker   // %2 = load float addrspace(3)* %0
260*9880d681SAndroid Build Coastguard Worker   //
261*9880d681SAndroid Build Coastguard Worker   // Note: the addrspacecast can also be a constant expression.
262*9880d681SAndroid Build Coastguard Worker   assert(isEliminableAddrSpaceCast(NewOperand));
263*9880d681SAndroid Build Coastguard Worker   Operator *ASC = dyn_cast<Operator>(NewOperand);
264*9880d681SAndroid Build Coastguard Worker   MI->setOperand(Idx, ASC->getOperand(0));
265*9880d681SAndroid Build Coastguard Worker   return true;
266*9880d681SAndroid Build Coastguard Worker }
267*9880d681SAndroid Build Coastguard Worker 
runOnFunction(Function & F)268*9880d681SAndroid Build Coastguard Worker bool NVPTXFavorNonGenericAddrSpaces::runOnFunction(Function &F) {
269*9880d681SAndroid Build Coastguard Worker   if (DisableFavorNonGeneric || skipFunction(F))
270*9880d681SAndroid Build Coastguard Worker     return false;
271*9880d681SAndroid Build Coastguard Worker 
272*9880d681SAndroid Build Coastguard Worker   bool Changed = false;
273*9880d681SAndroid Build Coastguard Worker   for (BasicBlock &B : F) {
274*9880d681SAndroid Build Coastguard Worker     for (Instruction &I : B) {
275*9880d681SAndroid Build Coastguard Worker       if (isa<LoadInst>(I)) {
276*9880d681SAndroid Build Coastguard Worker         // V = load P
277*9880d681SAndroid Build Coastguard Worker         Changed |= optimizeMemoryInstruction(&I, 0);
278*9880d681SAndroid Build Coastguard Worker       } else if (isa<StoreInst>(I)) {
279*9880d681SAndroid Build Coastguard Worker         // store V, P
280*9880d681SAndroid Build Coastguard Worker         Changed |= optimizeMemoryInstruction(&I, 1);
281*9880d681SAndroid Build Coastguard Worker       }
282*9880d681SAndroid Build Coastguard Worker     }
283*9880d681SAndroid Build Coastguard Worker   }
284*9880d681SAndroid Build Coastguard Worker   return Changed;
285*9880d681SAndroid Build Coastguard Worker }
286*9880d681SAndroid Build Coastguard Worker 
createNVPTXFavorNonGenericAddrSpacesPass()287*9880d681SAndroid Build Coastguard Worker FunctionPass *llvm::createNVPTXFavorNonGenericAddrSpacesPass() {
288*9880d681SAndroid Build Coastguard Worker   return new NVPTXFavorNonGenericAddrSpaces();
289*9880d681SAndroid Build Coastguard Worker }
290