LLVM  8.0.1
NVPTXImageOptimizer.cpp
Go to the documentation of this file.
1 //===-- NVPTXImageOptimizer.cpp - Image optimization pass -----------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This pass implements IR-level optimizations of image access code,
11 // including:
12 //
13 // 1. Eliminate istypep intrinsics when image access qualifier is known
14 //
15 //===----------------------------------------------------------------------===//
16 
17 #include "NVPTX.h"
18 #include "NVPTXUtilities.h"
20 #include "llvm/IR/Instructions.h"
21 #include "llvm/IR/Intrinsics.h"
22 #include "llvm/IR/Module.h"
23 #include "llvm/Pass.h"
24 
25 using namespace llvm;
26 
27 namespace {
28 class NVPTXImageOptimizer : public FunctionPass {
29 private:
30  static char ID;
31  SmallVector<Instruction*, 4> InstrToDelete;
32 
33 public:
34  NVPTXImageOptimizer();
35 
36  bool runOnFunction(Function &F) override;
37 
38 private:
39  bool replaceIsTypePSampler(Instruction &I);
40  bool replaceIsTypePSurface(Instruction &I);
41  bool replaceIsTypePTexture(Instruction &I);
42  Value *cleanupValue(Value *V);
43  void replaceWith(Instruction *From, ConstantInt *To);
44 };
45 }
46 
48 
49 NVPTXImageOptimizer::NVPTXImageOptimizer()
50  : FunctionPass(ID) {}
51 
53  if (skipFunction(F))
54  return false;
55 
56  bool Changed = false;
57  InstrToDelete.clear();
58 
59  // Look for call instructions in the function
60  for (Function::iterator BI = F.begin(), BE = F.end(); BI != BE;
61  ++BI) {
62  for (BasicBlock::iterator I = (*BI).begin(), E = (*BI).end();
63  I != E; ++I) {
64  Instruction &Instr = *I;
65  if (CallInst *CI = dyn_cast<CallInst>(I)) {
66  Function *CalledF = CI->getCalledFunction();
67  if (CalledF && CalledF->isIntrinsic()) {
68  // This is an intrinsic function call, check if its an istypep
69  switch (CalledF->getIntrinsicID()) {
70  default: break;
72  Changed |= replaceIsTypePSampler(Instr);
73  break;
75  Changed |= replaceIsTypePSurface(Instr);
76  break;
78  Changed |= replaceIsTypePTexture(Instr);
79  break;
80  }
81  }
82  }
83  }
84  }
85 
86  // Delete any istypep instances we replaced in the IR
87  for (unsigned i = 0, e = InstrToDelete.size(); i != e; ++i)
88  InstrToDelete[i]->eraseFromParent();
89 
90  return Changed;
91 }
92 
93 bool NVPTXImageOptimizer::replaceIsTypePSampler(Instruction &I) {
94  Value *TexHandle = cleanupValue(I.getOperand(0));
95  if (isSampler(*TexHandle)) {
96  // This is an OpenCL sampler, so it must be a samplerref
97  replaceWith(&I, ConstantInt::getTrue(I.getContext()));
98  return true;
99  } else if (isImage(*TexHandle)) {
100  // This is an OpenCL image, so it cannot be a samplerref
101  replaceWith(&I, ConstantInt::getFalse(I.getContext()));
102  return true;
103  } else {
104  // The image type is unknown, so we cannot eliminate the intrinsic
105  return false;
106  }
107 }
108 
109 bool NVPTXImageOptimizer::replaceIsTypePSurface(Instruction &I) {
110  Value *TexHandle = cleanupValue(I.getOperand(0));
111  if (isImageReadWrite(*TexHandle) ||
112  isImageWriteOnly(*TexHandle)) {
113  // This is an OpenCL read-only/read-write image, so it must be a surfref
114  replaceWith(&I, ConstantInt::getTrue(I.getContext()));
115  return true;
116  } else if (isImageReadOnly(*TexHandle) ||
117  isSampler(*TexHandle)) {
118  // This is an OpenCL read-only/ imageor sampler, so it cannot be
119  // a surfref
120  replaceWith(&I, ConstantInt::getFalse(I.getContext()));
121  return true;
122  } else {
123  // The image type is unknown, so we cannot eliminate the intrinsic
124  return false;
125  }
126 }
127 
128 bool NVPTXImageOptimizer::replaceIsTypePTexture(Instruction &I) {
129  Value *TexHandle = cleanupValue(I.getOperand(0));
130  if (isImageReadOnly(*TexHandle)) {
131  // This is an OpenCL read-only image, so it must be a texref
132  replaceWith(&I, ConstantInt::getTrue(I.getContext()));
133  return true;
134  } else if (isImageWriteOnly(*TexHandle) ||
135  isImageReadWrite(*TexHandle) ||
136  isSampler(*TexHandle)) {
137  // This is an OpenCL read-write/write-only image or a sampler, so it
138  // cannot be a texref
139  replaceWith(&I, ConstantInt::getFalse(I.getContext()));
140  return true;
141  } else {
142  // The image type is unknown, so we cannot eliminate the intrinsic
143  return false;
144  }
145 }
146 
147 void NVPTXImageOptimizer::replaceWith(Instruction *From, ConstantInt *To) {
148  // We implement "poor man's DCE" here to make sure any code that is no longer
149  // live is actually unreachable and can be trivially eliminated by the
150  // unreachable block elimination pass.
151  for (CallInst::use_iterator UI = From->use_begin(), UE = From->use_end();
152  UI != UE; ++UI) {
153  if (BranchInst *BI = dyn_cast<BranchInst>(*UI)) {
154  if (BI->isUnconditional()) continue;
155  BasicBlock *Dest;
156  if (To->isZero())
157  // Get false block
158  Dest = BI->getSuccessor(1);
159  else
160  // Get true block
161  Dest = BI->getSuccessor(0);
162  BranchInst::Create(Dest, BI);
163  InstrToDelete.push_back(BI);
164  }
165  }
166  From->replaceAllUsesWith(To);
167  InstrToDelete.push_back(From);
168 }
169 
170 Value *NVPTXImageOptimizer::cleanupValue(Value *V) {
171  if (ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(V)) {
172  return cleanupValue(EVI->getAggregateOperand());
173  }
174  return V;
175 }
176 
178  return new NVPTXImageOptimizer();
179 }
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition: Function.h:199
use_iterator use_end()
Definition: Value.h:347
This instruction extracts a struct member or array element value from an aggregate value...
This class represents lattice values for constants.
Definition: AllocatorList.h:24
iterator end()
Definition: Function.h:658
This class represents a function call, abstracting a target machine's calling convention.
LLVMContext & getContext() const
All values hold a context through their type.
Definition: Value.cpp:705
F(f)
static Constant * getTrue(Type *Ty)
For a boolean type or a vector of boolean type, return true or a vector with every element true...
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:429
FunctionPass * createNVPTXImageOptimizerPass()
iterator begin()
Definition: Function.h:656
bool isSampler(const Value &val)
Value * getOperand(unsigned i) const
Definition: User.h:170
static bool runOnFunction(Function &F, bool PostInlining)
LLVM Basic Block Representation.
Definition: BasicBlock.h:58
Conditional or Unconditional Branch instruction.
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:285
bool isImage(const Value &val)
Iterator for intrusive lists based on ilist_node.
This is the shared class of boolean and integer constants.
Definition: Constants.h:84
BlockVerifier::State From
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small...
Definition: SmallVector.h:847
Module.h This file contains the declarations for the Module class.
bool isImageReadWrite(const Value &val)
Intrinsic::ID getIntrinsicID() const LLVM_READONLY
getIntrinsicID - This method returns the ID number of the specified function, or Intrinsic::not_intri...
Definition: Function.h:194
static Constant * getFalse(Type *Ty)
For a boolean type or a vector of boolean type, return false or a vector with every element false...
use_iterator use_begin()
Definition: Value.h:339
bool isImageReadOnly(const Value &val)
#define I(x, y, z)
Definition: MD5.cpp:58
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
Definition: Constants.h:193
LLVM Value Representation.
Definition: Value.h:73
bool isImageWriteOnly(const Value &val)