blob: 12121d7174339bcb58e15d1c371762040877d965 [file] [log] [blame]
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +00001//===- CFLGraph.h - Abstract stratified sets implementation. -----*- C++-*-===//
George Burgess IV02af2782016-07-06 00:36:12 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +00009//
George Burgess IV02af2782016-07-06 00:36:12 +000010/// \file
11/// This file defines CFLGraph, an auxiliary data structure used by CFL-based
12/// alias analysis.
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000013//
George Burgess IV02af2782016-07-06 00:36:12 +000014//===----------------------------------------------------------------------===//
15
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000016#ifndef LLVM_LIB_ANALYSIS_CFLGRAPH_H
17#define LLVM_LIB_ANALYSIS_CFLGRAPH_H
George Burgess IV02af2782016-07-06 00:36:12 +000018
George Burgess IVcc48e0f2016-07-06 00:47:21 +000019#include "AliasAnalysisSummary.h"
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000020#include "llvm/ADT/APInt.h"
21#include "llvm/ADT/DenseMap.h"
22#include "llvm/ADT/SmallVector.h"
23#include "llvm/ADT/iterator_range.h"
George Burgess IV654ec292016-07-09 02:54:42 +000024#include "llvm/Analysis/MemoryBuiltins.h"
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000025#include "llvm/Analysis/TargetLibraryInfo.h"
26#include "llvm/IR/Argument.h"
27#include "llvm/IR/BasicBlock.h"
28#include "llvm/IR/CallSite.h"
29#include "llvm/IR/Constants.h"
30#include "llvm/IR/DataLayout.h"
31#include "llvm/IR/Function.h"
32#include "llvm/IR/GlobalValue.h"
George Burgess IV654ec292016-07-09 02:54:42 +000033#include "llvm/IR/InstVisitor.h"
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000034#include "llvm/IR/InstrTypes.h"
35#include "llvm/IR/Instruction.h"
George Burgess IV654ec292016-07-09 02:54:42 +000036#include "llvm/IR/Instructions.h"
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000037#include "llvm/IR/Operator.h"
38#include "llvm/IR/Type.h"
39#include "llvm/IR/Value.h"
40#include "llvm/Support/Casting.h"
41#include "llvm/Support/ErrorHandling.h"
42#include <cassert>
43#include <cstdint>
44#include <vector>
George Burgess IV02af2782016-07-06 00:36:12 +000045
46namespace llvm {
George Burgess IV02af2782016-07-06 00:36:12 +000047namespace cflaa {
George Burgess IV02af2782016-07-06 00:36:12 +000048
Adrian Prantl26b584c2018-05-01 15:54:18 +000049/// The Program Expression Graph (PEG) of CFL analysis
George Burgess IV02af2782016-07-06 00:36:12 +000050/// CFLGraph is auxiliary data structure used by CFL-based alias analysis to
51/// describe flow-insensitive pointer-related behaviors. Given an LLVM function,
52/// the main purpose of this graph is to abstract away unrelated facts and
53/// translate the rest into a form that can be easily digested by CFL analyses.
George Burgess IV9e937062016-07-11 22:59:09 +000054/// Each Node in the graph is an InstantiatedValue, and each edge represent a
55/// pointer assignment between InstantiatedValue. Pointer
56/// references/dereferences are not explicitly stored in the graph: we
57/// implicitly assume that for each node (X, I) it has a dereference edge to (X,
58/// I+1) and a reference edge to (X, I-1).
George Burgess IV02af2782016-07-06 00:36:12 +000059class CFLGraph {
George Burgess IV9e937062016-07-11 22:59:09 +000060public:
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000061 using Node = InstantiatedValue;
George Burgess IV02af2782016-07-06 00:36:12 +000062
63 struct Edge {
George Burgess IV02af2782016-07-06 00:36:12 +000064 Node Other;
George Burgess IV55033b02018-05-17 21:56:39 +000065 int64_t Offset;
George Burgess IV02af2782016-07-06 00:36:12 +000066 };
67
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +000068 using EdgeList = std::vector<Edge>;
George Burgess IV02af2782016-07-06 00:36:12 +000069
70 struct NodeInfo {
George Burgess IV723a3ff2016-07-15 19:53:25 +000071 EdgeList Edges, ReverseEdges;
George Burgess IVcc48e0f2016-07-06 00:47:21 +000072 AliasAttrs Attr;
George Burgess IV02af2782016-07-06 00:36:12 +000073 };
74
George Burgess IV9e937062016-07-11 22:59:09 +000075 class ValueInfo {
76 std::vector<NodeInfo> Levels;
George Burgess IV02af2782016-07-06 00:36:12 +000077
George Burgess IV9e937062016-07-11 22:59:09 +000078 public:
79 bool addNodeToLevel(unsigned Level) {
80 auto NumLevels = Levels.size();
81 if (NumLevels > Level)
82 return false;
83 Levels.resize(Level + 1);
84 return true;
George Burgess IV02af2782016-07-06 00:36:12 +000085 }
George Burgess IV9e937062016-07-11 22:59:09 +000086
87 NodeInfo &getNodeInfoAtLevel(unsigned Level) {
88 assert(Level < Levels.size());
89 return Levels[Level];
90 }
91 const NodeInfo &getNodeInfoAtLevel(unsigned Level) const {
92 assert(Level < Levels.size());
93 return Levels[Level];
94 }
95
96 unsigned getNumLevels() const { return Levels.size(); }
97 };
98
99private:
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +0000100 using ValueMap = DenseMap<Value *, ValueInfo>;
101
George Burgess IV9e937062016-07-11 22:59:09 +0000102 ValueMap ValueImpls;
George Burgess IV02af2782016-07-06 00:36:12 +0000103
George Burgess IV02af2782016-07-06 00:36:12 +0000104 NodeInfo *getNode(Node N) {
George Burgess IV9e937062016-07-11 22:59:09 +0000105 auto Itr = ValueImpls.find(N.Val);
106 if (Itr == ValueImpls.end() || Itr->second.getNumLevels() <= N.DerefLevel)
George Burgess IV02af2782016-07-06 00:36:12 +0000107 return nullptr;
George Burgess IV9e937062016-07-11 22:59:09 +0000108 return &Itr->second.getNodeInfoAtLevel(N.DerefLevel);
George Burgess IV02af2782016-07-06 00:36:12 +0000109 }
110
George Burgess IV02af2782016-07-06 00:36:12 +0000111public:
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +0000112 using const_value_iterator = ValueMap::const_iterator;
George Burgess IV02af2782016-07-06 00:36:12 +0000113
George Burgess IV9e937062016-07-11 22:59:09 +0000114 bool addNode(Node N, AliasAttrs Attr = AliasAttrs()) {
115 assert(N.Val != nullptr);
116 auto &ValInfo = ValueImpls[N.Val];
117 auto Changed = ValInfo.addNodeToLevel(N.DerefLevel);
118 ValInfo.getNodeInfoAtLevel(N.DerefLevel).Attr |= Attr;
119 return Changed;
George Burgess IV02af2782016-07-06 00:36:12 +0000120 }
121
George Burgess IVcc48e0f2016-07-06 00:47:21 +0000122 void addAttr(Node N, AliasAttrs Attr) {
George Burgess IV02af2782016-07-06 00:36:12 +0000123 auto *Info = getNode(N);
124 assert(Info != nullptr);
125 Info->Attr |= Attr;
126 }
127
George Burgess IV55033b02018-05-17 21:56:39 +0000128 void addEdge(Node From, Node To, int64_t Offset = 0) {
George Burgess IV02af2782016-07-06 00:36:12 +0000129 auto *FromInfo = getNode(From);
130 assert(FromInfo != nullptr);
George Burgess IV723a3ff2016-07-15 19:53:25 +0000131 auto *ToInfo = getNode(To);
132 assert(ToInfo != nullptr);
133
George Burgess IV7a905f92016-07-20 22:53:30 +0000134 FromInfo->Edges.push_back(Edge{To, Offset});
135 ToInfo->ReverseEdges.push_back(Edge{From, Offset});
George Burgess IV723a3ff2016-07-15 19:53:25 +0000136 }
137
138 const NodeInfo *getNode(Node N) const {
139 auto Itr = ValueImpls.find(N.Val);
140 if (Itr == ValueImpls.end() || Itr->second.getNumLevels() <= N.DerefLevel)
141 return nullptr;
142 return &Itr->second.getNodeInfoAtLevel(N.DerefLevel);
George Burgess IV02af2782016-07-06 00:36:12 +0000143 }
144
George Burgess IVcc48e0f2016-07-06 00:47:21 +0000145 AliasAttrs attrFor(Node N) const {
George Burgess IV02af2782016-07-06 00:36:12 +0000146 auto *Info = getNode(N);
147 assert(Info != nullptr);
148 return Info->Attr;
149 }
150
George Burgess IV9e937062016-07-11 22:59:09 +0000151 iterator_range<const_value_iterator> value_mappings() const {
152 return make_range<const_value_iterator>(ValueImpls.begin(),
153 ValueImpls.end());
George Burgess IV02af2782016-07-06 00:36:12 +0000154 }
George Burgess IV02af2782016-07-06 00:36:12 +0000155};
George Burgess IV654ec292016-07-09 02:54:42 +0000156
Adrian Prantl26b584c2018-05-01 15:54:18 +0000157///A builder class used to create CFLGraph instance from a given function
George Burgess IV654ec292016-07-09 02:54:42 +0000158/// The CFL-AA that uses this builder must provide its own type as a template
159/// argument. This is necessary for interprocedural processing: CFLGraphBuilder
160/// needs a way of obtaining the summary of other functions when callinsts are
161/// encountered.
162/// As a result, we expect the said CFL-AA to expose a getAliasSummary() public
163/// member function that takes a Function& and returns the corresponding summary
164/// as a const AliasSummary*.
165template <typename CFLAA> class CFLGraphBuilder {
166 // Input of the builder
167 CFLAA &Analysis;
168 const TargetLibraryInfo &TLI;
169
170 // Output of the builder
171 CFLGraph Graph;
172 SmallVector<Value *, 4> ReturnedValues;
173
George Burgess IV654ec292016-07-09 02:54:42 +0000174 // Helper class
175 /// Gets the edges our graph should have, based on an Instruction*
176 class GetEdgesVisitor : public InstVisitor<GetEdgesVisitor, void> {
177 CFLAA &AA;
George Burgess IV7a905f92016-07-20 22:53:30 +0000178 const DataLayout &DL;
George Burgess IV654ec292016-07-09 02:54:42 +0000179 const TargetLibraryInfo &TLI;
180
181 CFLGraph &Graph;
182 SmallVectorImpl<Value *> &ReturnValues;
George Burgess IV654ec292016-07-09 02:54:42 +0000183
184 static bool hasUsefulEdges(ConstantExpr *CE) {
185 // ConstantExpr doesn't have terminators, invokes, or fences, so only
186 // needs
187 // to check for compares.
188 return CE->getOpcode() != Instruction::ICmp &&
189 CE->getOpcode() != Instruction::FCmp;
190 }
191
192 // Returns possible functions called by CS into the given SmallVectorImpl.
193 // Returns true if targets found, false otherwise.
194 static bool getPossibleTargets(CallSite CS,
195 SmallVectorImpl<Function *> &Output) {
196 if (auto *Fn = CS.getCalledFunction()) {
197 Output.push_back(Fn);
198 return true;
199 }
200
201 // TODO: If the call is indirect, we might be able to enumerate all
202 // potential
203 // targets of the call and return them, rather than just failing.
204 return false;
205 }
206
George Burgess IV9e937062016-07-11 22:59:09 +0000207 void addNode(Value *Val, AliasAttrs Attr = AliasAttrs()) {
208 assert(Val != nullptr && Val->getType()->isPointerTy());
209 if (auto GVal = dyn_cast<GlobalValue>(Val)) {
210 if (Graph.addNode(InstantiatedValue{GVal, 0},
211 getGlobalOrArgAttrFromValue(*GVal)))
212 Graph.addNode(InstantiatedValue{GVal, 1}, getAttrUnknown());
213 } else if (auto CExpr = dyn_cast<ConstantExpr>(Val)) {
214 if (hasUsefulEdges(CExpr)) {
215 if (Graph.addNode(InstantiatedValue{CExpr, 0}))
216 visitConstantExpr(CExpr);
217 }
218 } else
219 Graph.addNode(InstantiatedValue{Val, 0}, Attr);
George Burgess IV654ec292016-07-09 02:54:42 +0000220 }
221
George Burgess IV55033b02018-05-17 21:56:39 +0000222 void addAssignEdge(Value *From, Value *To, int64_t Offset = 0) {
George Burgess IV654ec292016-07-09 02:54:42 +0000223 assert(From != nullptr && To != nullptr);
224 if (!From->getType()->isPointerTy() || !To->getType()->isPointerTy())
225 return;
226 addNode(From);
George Burgess IV9e937062016-07-11 22:59:09 +0000227 if (To != From) {
George Burgess IV654ec292016-07-09 02:54:42 +0000228 addNode(To);
George Burgess IV9e937062016-07-11 22:59:09 +0000229 Graph.addEdge(InstantiatedValue{From, 0}, InstantiatedValue{To, 0},
230 Offset);
231 }
232 }
233
George Burgess IV723a3ff2016-07-15 19:53:25 +0000234 void addDerefEdge(Value *From, Value *To, bool IsRead) {
George Burgess IV9e937062016-07-11 22:59:09 +0000235 assert(From != nullptr && To != nullptr);
George Burgess IV4e7dec82017-05-31 02:35:26 +0000236 // FIXME: This is subtly broken, due to how we model some instructions
237 // (e.g. extractvalue, extractelement) as loads. Since those take
238 // non-pointer operands, we'll entirely skip adding edges for those.
239 //
240 // addAssignEdge seems to have a similar issue with insertvalue, etc.
George Burgess IV9e937062016-07-11 22:59:09 +0000241 if (!From->getType()->isPointerTy() || !To->getType()->isPointerTy())
242 return;
243 addNode(From);
244 addNode(To);
George Burgess IV723a3ff2016-07-15 19:53:25 +0000245 if (IsRead) {
246 Graph.addNode(InstantiatedValue{From, 1});
247 Graph.addEdge(InstantiatedValue{From, 1}, InstantiatedValue{To, 0});
248 } else {
249 Graph.addNode(InstantiatedValue{To, 1});
250 Graph.addEdge(InstantiatedValue{From, 0}, InstantiatedValue{To, 1});
251 }
George Burgess IV654ec292016-07-09 02:54:42 +0000252 }
253
George Burgess IV723a3ff2016-07-15 19:53:25 +0000254 void addLoadEdge(Value *From, Value *To) { addDerefEdge(From, To, true); }
255 void addStoreEdge(Value *From, Value *To) { addDerefEdge(From, To, false); }
256
George Burgess IV654ec292016-07-09 02:54:42 +0000257 public:
George Burgess IV7a905f92016-07-20 22:53:30 +0000258 GetEdgesVisitor(CFLGraphBuilder &Builder, const DataLayout &DL)
259 : AA(Builder.Analysis), DL(DL), TLI(Builder.TLI), Graph(Builder.Graph),
George Burgess IV9e937062016-07-11 22:59:09 +0000260 ReturnValues(Builder.ReturnedValues) {}
George Burgess IV654ec292016-07-09 02:54:42 +0000261
262 void visitInstruction(Instruction &) {
263 llvm_unreachable("Unsupported instruction encountered");
264 }
265
266 void visitReturnInst(ReturnInst &Inst) {
267 if (auto RetVal = Inst.getReturnValue()) {
268 if (RetVal->getType()->isPointerTy()) {
269 addNode(RetVal);
270 ReturnValues.push_back(RetVal);
271 }
272 }
273 }
274
275 void visitPtrToIntInst(PtrToIntInst &Inst) {
276 auto *Ptr = Inst.getOperand(0);
George Burgess IV9e937062016-07-11 22:59:09 +0000277 addNode(Ptr, getAttrEscaped());
George Burgess IV654ec292016-07-09 02:54:42 +0000278 }
279
280 void visitIntToPtrInst(IntToPtrInst &Inst) {
281 auto *Ptr = &Inst;
George Burgess IV9e937062016-07-11 22:59:09 +0000282 addNode(Ptr, getAttrUnknown());
George Burgess IV654ec292016-07-09 02:54:42 +0000283 }
284
285 void visitCastInst(CastInst &Inst) {
286 auto *Src = Inst.getOperand(0);
George Burgess IV9e937062016-07-11 22:59:09 +0000287 addAssignEdge(Src, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000288 }
289
290 void visitBinaryOperator(BinaryOperator &Inst) {
291 auto *Op1 = Inst.getOperand(0);
292 auto *Op2 = Inst.getOperand(1);
George Burgess IV9e937062016-07-11 22:59:09 +0000293 addAssignEdge(Op1, &Inst);
294 addAssignEdge(Op2, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000295 }
296
297 void visitAtomicCmpXchgInst(AtomicCmpXchgInst &Inst) {
298 auto *Ptr = Inst.getPointerOperand();
299 auto *Val = Inst.getNewValOperand();
George Burgess IV723a3ff2016-07-15 19:53:25 +0000300 addStoreEdge(Val, Ptr);
George Burgess IV654ec292016-07-09 02:54:42 +0000301 }
302
303 void visitAtomicRMWInst(AtomicRMWInst &Inst) {
304 auto *Ptr = Inst.getPointerOperand();
305 auto *Val = Inst.getValOperand();
George Burgess IV723a3ff2016-07-15 19:53:25 +0000306 addStoreEdge(Val, Ptr);
George Burgess IV654ec292016-07-09 02:54:42 +0000307 }
308
309 void visitPHINode(PHINode &Inst) {
310 for (Value *Val : Inst.incoming_values())
George Burgess IV9e937062016-07-11 22:59:09 +0000311 addAssignEdge(Val, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000312 }
313
George Burgess IV7a905f92016-07-20 22:53:30 +0000314 void visitGEP(GEPOperator &GEPOp) {
George Burgess IV55033b02018-05-17 21:56:39 +0000315 uint64_t Offset = UnknownOffset;
George Burgess IV7a905f92016-07-20 22:53:30 +0000316 APInt APOffset(DL.getPointerSizeInBits(GEPOp.getPointerAddressSpace()),
317 0);
318 if (GEPOp.accumulateConstantOffset(DL, APOffset))
319 Offset = APOffset.getSExtValue();
320
321 auto *Op = GEPOp.getPointerOperand();
322 addAssignEdge(Op, &GEPOp, Offset);
323 }
324
George Burgess IV654ec292016-07-09 02:54:42 +0000325 void visitGetElementPtrInst(GetElementPtrInst &Inst) {
George Burgess IV7a905f92016-07-20 22:53:30 +0000326 auto *GEPOp = cast<GEPOperator>(&Inst);
327 visitGEP(*GEPOp);
George Burgess IV654ec292016-07-09 02:54:42 +0000328 }
329
330 void visitSelectInst(SelectInst &Inst) {
331 // Condition is not processed here (The actual statement producing
332 // the condition result is processed elsewhere). For select, the
333 // condition is evaluated, but not loaded, stored, or assigned
334 // simply as a result of being the condition of a select.
335
336 auto *TrueVal = Inst.getTrueValue();
337 auto *FalseVal = Inst.getFalseValue();
George Burgess IV9e937062016-07-11 22:59:09 +0000338 addAssignEdge(TrueVal, &Inst);
339 addAssignEdge(FalseVal, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000340 }
341
George Burgess IV9e937062016-07-11 22:59:09 +0000342 void visitAllocaInst(AllocaInst &Inst) { addNode(&Inst); }
George Burgess IV654ec292016-07-09 02:54:42 +0000343
344 void visitLoadInst(LoadInst &Inst) {
345 auto *Ptr = Inst.getPointerOperand();
346 auto *Val = &Inst;
George Burgess IV723a3ff2016-07-15 19:53:25 +0000347 addLoadEdge(Ptr, Val);
George Burgess IV654ec292016-07-09 02:54:42 +0000348 }
349
350 void visitStoreInst(StoreInst &Inst) {
351 auto *Ptr = Inst.getPointerOperand();
352 auto *Val = Inst.getValueOperand();
George Burgess IV723a3ff2016-07-15 19:53:25 +0000353 addStoreEdge(Val, Ptr);
George Burgess IV654ec292016-07-09 02:54:42 +0000354 }
355
356 void visitVAArgInst(VAArgInst &Inst) {
357 // We can't fully model va_arg here. For *Ptr = Inst.getOperand(0), it
358 // does
359 // two things:
360 // 1. Loads a value from *((T*)*Ptr).
361 // 2. Increments (stores to) *Ptr by some target-specific amount.
362 // For now, we'll handle this like a landingpad instruction (by placing
363 // the
364 // result in its own group, and having that group alias externals).
George Burgess IV450453a2016-07-29 01:23:45 +0000365 if (Inst.getType()->isPointerTy())
366 addNode(&Inst, getAttrUnknown());
George Burgess IV654ec292016-07-09 02:54:42 +0000367 }
368
369 static bool isFunctionExternal(Function *Fn) {
370 return !Fn->hasExactDefinition();
371 }
372
373 bool tryInterproceduralAnalysis(CallSite CS,
374 const SmallVectorImpl<Function *> &Fns) {
375 assert(Fns.size() > 0);
376
377 if (CS.arg_size() > MaxSupportedArgsInSummary)
378 return false;
379
380 // Exit early if we'll fail anyway
381 for (auto *Fn : Fns) {
382 if (isFunctionExternal(Fn) || Fn->isVarArg())
383 return false;
384 // Fail if the caller does not provide enough arguments
385 assert(Fn->arg_size() <= CS.arg_size());
386 if (!AA.getAliasSummary(*Fn))
387 return false;
388 }
389
390 for (auto *Fn : Fns) {
391 auto Summary = AA.getAliasSummary(*Fn);
392 assert(Summary != nullptr);
393
394 auto &RetParamRelations = Summary->RetParamRelations;
395 for (auto &Relation : RetParamRelations) {
396 auto IRelation = instantiateExternalRelation(Relation, CS);
George Burgess IV9e937062016-07-11 22:59:09 +0000397 if (IRelation.hasValue()) {
398 Graph.addNode(IRelation->From);
399 Graph.addNode(IRelation->To);
George Burgess IV55033b02018-05-17 21:56:39 +0000400 Graph.addEdge(IRelation->From, IRelation->To);
George Burgess IV9e937062016-07-11 22:59:09 +0000401 }
George Burgess IV654ec292016-07-09 02:54:42 +0000402 }
403
404 auto &RetParamAttributes = Summary->RetParamAttributes;
405 for (auto &Attribute : RetParamAttributes) {
406 auto IAttr = instantiateExternalAttribute(Attribute, CS);
407 if (IAttr.hasValue())
George Burgess IV9e937062016-07-11 22:59:09 +0000408 Graph.addNode(IAttr->IValue, IAttr->Attr);
George Burgess IV654ec292016-07-09 02:54:42 +0000409 }
410 }
411
412 return true;
413 }
414
415 void visitCallSite(CallSite CS) {
416 auto Inst = CS.getInstruction();
417
418 // Make sure all arguments and return value are added to the graph first
419 for (Value *V : CS.args())
George Burgess IV9e937062016-07-11 22:59:09 +0000420 if (V->getType()->isPointerTy())
421 addNode(V);
George Burgess IV654ec292016-07-09 02:54:42 +0000422 if (Inst->getType()->isPointerTy())
423 addNode(Inst);
424
425 // Check if Inst is a call to a library function that
George Burgess IV758389d2018-05-26 02:17:43 +0000426 // allocates/deallocates on the heap. Those kinds of functions do not
427 // introduce any aliases.
George Burgess IV654ec292016-07-09 02:54:42 +0000428 // TODO: address other common library functions such as realloc(),
George Burgess IV758389d2018-05-26 02:17:43 +0000429 // strdup(), etc.
Craig Toppera8fe21d2017-04-18 21:43:46 +0000430 if (isMallocOrCallocLikeFn(Inst, &TLI) || isFreeCall(Inst, &TLI))
George Burgess IV654ec292016-07-09 02:54:42 +0000431 return;
432
433 // TODO: Add support for noalias args/all the other fun function
George Burgess IV758389d2018-05-26 02:17:43 +0000434 // attributes that we can tack on.
George Burgess IV654ec292016-07-09 02:54:42 +0000435 SmallVector<Function *, 4> Targets;
436 if (getPossibleTargets(CS, Targets))
437 if (tryInterproceduralAnalysis(CS, Targets))
438 return;
439
440 // Because the function is opaque, we need to note that anything
441 // could have happened to the arguments (unless the function is marked
442 // readonly or readnone), and that the result could alias just about
443 // anything, too (unless the result is marked noalias).
444 if (!CS.onlyReadsMemory())
445 for (Value *V : CS.args()) {
446 if (V->getType()->isPointerTy()) {
447 // The argument itself escapes.
George Burgess IV9e937062016-07-11 22:59:09 +0000448 Graph.addAttr(InstantiatedValue{V, 0}, getAttrEscaped());
George Burgess IV654ec292016-07-09 02:54:42 +0000449 // The fate of argument memory is unknown. Note that since
George Burgess IV9e937062016-07-11 22:59:09 +0000450 // AliasAttrs is transitive with respect to dereference, we only
451 // need to specify it for the first-level memory.
452 Graph.addNode(InstantiatedValue{V, 1}, getAttrUnknown());
George Burgess IV654ec292016-07-09 02:54:42 +0000453 }
454 }
455
456 if (Inst->getType()->isPointerTy()) {
457 auto *Fn = CS.getCalledFunction();
Reid Klecknera82b3762017-05-03 18:17:31 +0000458 if (Fn == nullptr || !Fn->returnDoesNotAlias())
George Burgess IV9e937062016-07-11 22:59:09 +0000459 // No need to call addNode() since we've added Inst at the
George Burgess IV654ec292016-07-09 02:54:42 +0000460 // beginning of this function and we know it is not a global.
George Burgess IV9e937062016-07-11 22:59:09 +0000461 Graph.addAttr(InstantiatedValue{Inst, 0}, getAttrUnknown());
George Burgess IV654ec292016-07-09 02:54:42 +0000462 }
463 }
464
465 /// Because vectors/aggregates are immutable and unaddressable, there's
466 /// nothing we can do to coax a value out of them, other than calling
467 /// Extract{Element,Value}. We can effectively treat them as pointers to
468 /// arbitrary memory locations we can store in and load from.
469 void visitExtractElementInst(ExtractElementInst &Inst) {
470 auto *Ptr = Inst.getVectorOperand();
471 auto *Val = &Inst;
George Burgess IV723a3ff2016-07-15 19:53:25 +0000472 addLoadEdge(Ptr, Val);
George Burgess IV654ec292016-07-09 02:54:42 +0000473 }
474
475 void visitInsertElementInst(InsertElementInst &Inst) {
476 auto *Vec = Inst.getOperand(0);
477 auto *Val = Inst.getOperand(1);
George Burgess IV9e937062016-07-11 22:59:09 +0000478 addAssignEdge(Vec, &Inst);
George Burgess IV723a3ff2016-07-15 19:53:25 +0000479 addStoreEdge(Val, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000480 }
481
482 void visitLandingPadInst(LandingPadInst &Inst) {
483 // Exceptions come from "nowhere", from our analysis' perspective.
484 // So we place the instruction its own group, noting that said group may
485 // alias externals
George Burgess IV450453a2016-07-29 01:23:45 +0000486 if (Inst.getType()->isPointerTy())
487 addNode(&Inst, getAttrUnknown());
George Burgess IV654ec292016-07-09 02:54:42 +0000488 }
489
490 void visitInsertValueInst(InsertValueInst &Inst) {
491 auto *Agg = Inst.getOperand(0);
492 auto *Val = Inst.getOperand(1);
George Burgess IV9e937062016-07-11 22:59:09 +0000493 addAssignEdge(Agg, &Inst);
George Burgess IV723a3ff2016-07-15 19:53:25 +0000494 addStoreEdge(Val, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000495 }
496
497 void visitExtractValueInst(ExtractValueInst &Inst) {
498 auto *Ptr = Inst.getAggregateOperand();
George Burgess IV723a3ff2016-07-15 19:53:25 +0000499 addLoadEdge(Ptr, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000500 }
501
502 void visitShuffleVectorInst(ShuffleVectorInst &Inst) {
503 auto *From1 = Inst.getOperand(0);
504 auto *From2 = Inst.getOperand(1);
George Burgess IV9e937062016-07-11 22:59:09 +0000505 addAssignEdge(From1, &Inst);
506 addAssignEdge(From2, &Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000507 }
508
509 void visitConstantExpr(ConstantExpr *CE) {
510 switch (CE->getOpcode()) {
George Burgess IV7a905f92016-07-20 22:53:30 +0000511 case Instruction::GetElementPtr: {
512 auto GEPOp = cast<GEPOperator>(CE);
513 visitGEP(*GEPOp);
514 break;
515 }
David Bolvansky090f8152018-05-01 21:35:32 +0000516
George Burgess IV7a905f92016-07-20 22:53:30 +0000517 case Instruction::PtrToInt: {
David Bolvansky090f8152018-05-01 21:35:32 +0000518 addNode(CE->getOperand(0), getAttrEscaped());
George Burgess IV7a905f92016-07-20 22:53:30 +0000519 break;
520 }
David Bolvansky090f8152018-05-01 21:35:32 +0000521
522 case Instruction::IntToPtr: {
George Burgess IV7a905f92016-07-20 22:53:30 +0000523 addNode(CE, getAttrUnknown());
524 break;
David Bolvansky090f8152018-05-01 21:35:32 +0000525 }
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +0000526
George Burgess IV7a905f92016-07-20 22:53:30 +0000527 case Instruction::BitCast:
528 case Instruction::AddrSpaceCast:
529 case Instruction::Trunc:
530 case Instruction::ZExt:
531 case Instruction::SExt:
532 case Instruction::FPExt:
533 case Instruction::FPTrunc:
534 case Instruction::UIToFP:
535 case Instruction::SIToFP:
536 case Instruction::FPToUI:
537 case Instruction::FPToSI: {
David Bolvansky090f8152018-05-01 21:35:32 +0000538 addAssignEdge(CE->getOperand(0), CE);
George Burgess IV7a905f92016-07-20 22:53:30 +0000539 break;
540 }
David Bolvansky090f8152018-05-01 21:35:32 +0000541
David Bolvansky74080eb2018-05-10 11:47:36 +0000542 case Instruction::Select: {
543 addAssignEdge(CE->getOperand(1), CE);
544 addAssignEdge(CE->getOperand(2), CE);
545 break;
546 }
547
David Bolvansky090f8152018-05-01 21:35:32 +0000548 case Instruction::InsertElement:
George Burgess IV7a905f92016-07-20 22:53:30 +0000549 case Instruction::InsertValue: {
David Bolvansky090f8152018-05-01 21:35:32 +0000550 addAssignEdge(CE->getOperand(0), CE);
551 addStoreEdge(CE->getOperand(1), CE);
George Burgess IV7a905f92016-07-20 22:53:30 +0000552 break;
553 }
David Bolvansky090f8152018-05-01 21:35:32 +0000554
555 case Instruction::ExtractElement:
George Burgess IV7a905f92016-07-20 22:53:30 +0000556 case Instruction::ExtractValue: {
David Bolvansky090f8152018-05-01 21:35:32 +0000557 addLoadEdge(CE->getOperand(0), CE);
George Burgess IV4e7dec82017-05-31 02:35:26 +0000558 break;
George Burgess IV7a905f92016-07-20 22:53:30 +0000559 }
David Bolvansky090f8152018-05-01 21:35:32 +0000560
George Burgess IV7a905f92016-07-20 22:53:30 +0000561 case Instruction::Add:
562 case Instruction::Sub:
563 case Instruction::FSub:
564 case Instruction::Mul:
565 case Instruction::FMul:
566 case Instruction::UDiv:
567 case Instruction::SDiv:
568 case Instruction::FDiv:
569 case Instruction::URem:
570 case Instruction::SRem:
571 case Instruction::FRem:
572 case Instruction::And:
573 case Instruction::Or:
574 case Instruction::Xor:
575 case Instruction::Shl:
576 case Instruction::LShr:
577 case Instruction::AShr:
578 case Instruction::ICmp:
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +0000579 case Instruction::FCmp:
David Bolvansky090f8152018-05-01 21:35:32 +0000580 case Instruction::ShuffleVector: {
George Burgess IV7a905f92016-07-20 22:53:30 +0000581 addAssignEdge(CE->getOperand(0), CE);
582 addAssignEdge(CE->getOperand(1), CE);
583 break;
David Bolvansky090f8152018-05-01 21:35:32 +0000584 }
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +0000585
George Burgess IV654ec292016-07-09 02:54:42 +0000586 default:
587 llvm_unreachable("Unknown instruction type encountered!");
George Burgess IV654ec292016-07-09 02:54:42 +0000588 }
589 }
590 };
591
592 // Helper functions
593
594 // Determines whether or not we an instruction is useless to us (e.g.
595 // FenceInst)
596 static bool hasUsefulEdges(Instruction *Inst) {
Chandler Carruth9179aee2018-08-26 09:51:22 +0000597 bool IsNonInvokeRetTerminator = Inst->isTerminator() &&
George Burgess IV654ec292016-07-09 02:54:42 +0000598 !isa<InvokeInst>(Inst) &&
599 !isa<ReturnInst>(Inst);
600 return !isa<CmpInst>(Inst) && !isa<FenceInst>(Inst) &&
601 !IsNonInvokeRetTerminator;
602 }
603
604 void addArgumentToGraph(Argument &Arg) {
605 if (Arg.getType()->isPointerTy()) {
George Burgess IV9e937062016-07-11 22:59:09 +0000606 Graph.addNode(InstantiatedValue{&Arg, 0},
607 getGlobalOrArgAttrFromValue(Arg));
George Burgess IV654ec292016-07-09 02:54:42 +0000608 // Pointees of a formal parameter is known to the caller
George Burgess IV9e937062016-07-11 22:59:09 +0000609 Graph.addNode(InstantiatedValue{&Arg, 1}, getAttrCaller());
George Burgess IV654ec292016-07-09 02:54:42 +0000610 }
611 }
612
613 // Given an Instruction, this will add it to the graph, along with any
614 // Instructions that are potentially only available from said Instruction
615 // For example, given the following line:
616 // %0 = load i16* getelementptr ([1 x i16]* @a, 0, 0), align 2
617 // addInstructionToGraph would add both the `load` and `getelementptr`
618 // instructions to the graph appropriately.
George Burgess IV9e937062016-07-11 22:59:09 +0000619 void addInstructionToGraph(GetEdgesVisitor &Visitor, Instruction &Inst) {
George Burgess IV654ec292016-07-09 02:54:42 +0000620 if (!hasUsefulEdges(&Inst))
621 return;
622
George Burgess IV9e937062016-07-11 22:59:09 +0000623 Visitor.visit(Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000624 }
625
626 // Builds the graph needed for constructing the StratifiedSets for the given
627 // function
628 void buildGraphFrom(Function &Fn) {
George Burgess IV7a905f92016-07-20 22:53:30 +0000629 GetEdgesVisitor Visitor(*this, Fn.getParent()->getDataLayout());
George Burgess IV9e937062016-07-11 22:59:09 +0000630
George Burgess IV654ec292016-07-09 02:54:42 +0000631 for (auto &Bb : Fn.getBasicBlockList())
632 for (auto &Inst : Bb.getInstList())
George Burgess IV9e937062016-07-11 22:59:09 +0000633 addInstructionToGraph(Visitor, Inst);
George Burgess IV654ec292016-07-09 02:54:42 +0000634
635 for (auto &Arg : Fn.args())
636 addArgumentToGraph(Arg);
637 }
638
639public:
640 CFLGraphBuilder(CFLAA &Analysis, const TargetLibraryInfo &TLI, Function &Fn)
641 : Analysis(Analysis), TLI(TLI) {
642 buildGraphFrom(Fn);
643 }
644
645 const CFLGraph &getCFLGraph() const { return Graph; }
646 const SmallVector<Value *, 4> &getReturnValues() const {
647 return ReturnedValues;
648 }
George Burgess IV654ec292016-07-09 02:54:42 +0000649};
George Burgess IV02af2782016-07-06 00:36:12 +0000650
Eugene Zelenkoc5e4ac82017-08-11 21:30:02 +0000651} // end namespace cflaa
652} // end namespace llvm
653
654#endif // LLVM_LIB_ANALYSIS_CFLGRAPH_H