1 //===-- llvm/IR/Statepoint.h - gc.statepoint utilities ------ --*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains utility functions and a wrapper class analogous to
11 // CallSite for accessing the fields of gc.statepoint, gc.relocate, and
12 // gc.result intrinsics
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #ifndef LLVM_IR_STATEPOINT_H
17 #define LLVM_IR_STATEPOINT_H
18 
19 #include "llvm/ADT/iterator_range.h"
20 #include "llvm/IR/BasicBlock.h"
21 #include "llvm/IR/CallSite.h"
22 #include "llvm/IR/Constants.h"
23 #include "llvm/IR/Function.h"
24 #include "llvm/IR/Instructions.h"
25 #include "llvm/IR/Intrinsics.h"
26 #include "llvm/Support/Compiler.h"
27 
28 namespace llvm {
29 /// The statepoint intrinsic accepts a set of flags as its third argument.
30 /// Valid values come out of this set.
31 enum class StatepointFlags {
32   None = 0,
33   GCTransition = 1, ///< Indicates that this statepoint is a transition from
34                     ///< GC-aware code to code that is not GC-aware.
35 
36   MaskAll = GCTransition ///< A bitmask that includes all valid flags.
37 };
38 
39 class GCRelocateOperands;
40 class ImmutableStatepoint;
41 
42 bool isStatepoint(const ImmutableCallSite &CS);
43 bool isStatepoint(const Value *V);
44 bool isStatepoint(const Value &V);
45 
46 bool isGCRelocate(const Value *V);
47 bool isGCRelocate(const ImmutableCallSite &CS);
48 
49 bool isGCResult(const Value *V);
50 bool isGCResult(const ImmutableCallSite &CS);
51 
52 /// Analogous to CallSiteBase, this provides most of the actual
53 /// functionality for Statepoint and ImmutableStatepoint.  It is
54 /// templatized to allow easily specializing of const and non-const
55 /// concrete subtypes.  This is structured analogous to CallSite
56 /// rather than the IntrinsicInst.h helpers since we want to support
57 /// invokable statepoints in the near future.
58 template <typename FunTy, typename InstructionTy, typename ValueTy,
59           typename CallSiteTy>
60 class StatepointBase {
61   CallSiteTy StatepointCS;
62   void *operator new(size_t, unsigned) = delete;
63   void *operator new(size_t s) = delete;
64 
65 protected:
StatepointBase(InstructionTy * I)66   explicit StatepointBase(InstructionTy *I) {
67     if (isStatepoint(I)) {
68       StatepointCS = CallSiteTy(I);
69       assert(StatepointCS && "isStatepoint implies CallSite");
70     }
71   }
StatepointBase(CallSiteTy CS)72   explicit StatepointBase(CallSiteTy CS) {
73     if (isStatepoint(CS))
74       StatepointCS = CS;
75   }
76 
77 public:
78   typedef typename CallSiteTy::arg_iterator arg_iterator;
79 
80   enum {
81     IDPos = 0,
82     NumPatchBytesPos = 1,
83     CalledFunctionPos = 2,
84     NumCallArgsPos = 3,
85     FlagsPos = 4,
86     CallArgsBeginPos = 5,
87   };
88 
89   explicit operator bool() const {
90     // We do not assign non-statepoint CallSites to StatepointCS.
91     return (bool)StatepointCS;
92   }
93 
94   /// Return the underlying CallSite.
getCallSite()95   CallSiteTy getCallSite() const {
96     assert(*this && "check validity first!");
97     return StatepointCS;
98   }
99 
getFlags()100   uint64_t getFlags() const {
101     return cast<ConstantInt>(getCallSite().getArgument(FlagsPos))
102         ->getZExtValue();
103   }
104 
105   /// Return the ID associated with this statepoint.
getID()106   uint64_t getID() const {
107     const Value *IDVal = getCallSite().getArgument(IDPos);
108     return cast<ConstantInt>(IDVal)->getZExtValue();
109   }
110 
111   /// Return the number of patchable bytes associated with this statepoint.
getNumPatchBytes()112   uint32_t getNumPatchBytes() const {
113     const Value *NumPatchBytesVal = getCallSite().getArgument(NumPatchBytesPos);
114     uint64_t NumPatchBytes =
115       cast<ConstantInt>(NumPatchBytesVal)->getZExtValue();
116     assert(isInt<32>(NumPatchBytes) && "should fit in 32 bits!");
117     return NumPatchBytes;
118   }
119 
120   /// Return the value actually being called or invoked.
getCalledValue()121   ValueTy *getCalledValue() const {
122     return getCallSite().getArgument(CalledFunctionPos);
123   }
124 
getInstruction()125   InstructionTy *getInstruction() const {
126     return getCallSite().getInstruction();
127   }
128 
129   /// Return the function being called if this is a direct call, otherwise
130   /// return null (if it's an indirect call).
getCalledFunction()131   FunTy *getCalledFunction() const {
132     return dyn_cast<Function>(getCalledValue());
133   }
134 
135   /// Return the caller function for this statepoint.
getCaller()136   FunTy *getCaller() const { return getCallSite().getCaller(); }
137 
138   /// Determine if the statepoint cannot unwind.
doesNotThrow()139   bool doesNotThrow() const {
140     Function *F = getCalledFunction();
141     return getCallSite().doesNotThrow() || (F ? F->doesNotThrow() : false);
142   }
143 
144   /// Return the type of the value returned by the call underlying the
145   /// statepoint.
getActualReturnType()146   Type *getActualReturnType() const {
147     auto *FTy = cast<FunctionType>(
148         cast<PointerType>(getCalledValue()->getType())->getElementType());
149     return FTy->getReturnType();
150   }
151 
152   /// Number of arguments to be passed to the actual callee.
getNumCallArgs()153   int getNumCallArgs() const {
154     const Value *NumCallArgsVal = getCallSite().getArgument(NumCallArgsPos);
155     return cast<ConstantInt>(NumCallArgsVal)->getZExtValue();
156   }
157 
arg_size()158   size_t arg_size() const { return getNumCallArgs(); }
arg_begin()159   typename CallSiteTy::arg_iterator arg_begin() const {
160     assert(CallArgsBeginPos <= (int)getCallSite().arg_size());
161     return getCallSite().arg_begin() + CallArgsBeginPos;
162   }
arg_end()163   typename CallSiteTy::arg_iterator arg_end() const {
164     auto I = arg_begin() + arg_size();
165     assert((getCallSite().arg_end() - I) >= 0);
166     return I;
167   }
168 
getArgument(unsigned Index)169   ValueTy *getArgument(unsigned Index) {
170     assert(Index < arg_size() && "out of bounds!");
171     return *(arg_begin() + Index);
172   }
173 
174   /// range adapter for call arguments
call_args()175   iterator_range<arg_iterator> call_args() const {
176     return make_range(arg_begin(), arg_end());
177   }
178 
179   /// \brief Return true if the call or the callee has the given attribute.
paramHasAttr(unsigned i,Attribute::AttrKind A)180   bool paramHasAttr(unsigned i, Attribute::AttrKind A) const {
181     Function *F = getCalledFunction();
182     return getCallSite().paramHasAttr(i + CallArgsBeginPos, A) ||
183           (F ? F->getAttributes().hasAttribute(i, A) : false);
184   }
185 
186   /// Number of GC transition args.
getNumTotalGCTransitionArgs()187   int getNumTotalGCTransitionArgs() const {
188     const Value *NumGCTransitionArgs = *arg_end();
189     return cast<ConstantInt>(NumGCTransitionArgs)->getZExtValue();
190   }
gc_transition_args_begin()191   typename CallSiteTy::arg_iterator gc_transition_args_begin() const {
192     auto I = arg_end() + 1;
193     assert((getCallSite().arg_end() - I) >= 0);
194     return I;
195   }
gc_transition_args_end()196   typename CallSiteTy::arg_iterator gc_transition_args_end() const {
197     auto I = gc_transition_args_begin() + getNumTotalGCTransitionArgs();
198     assert((getCallSite().arg_end() - I) >= 0);
199     return I;
200   }
201 
202   /// range adapter for GC transition arguments
gc_transition_args()203   iterator_range<arg_iterator> gc_transition_args() const {
204     return make_range(gc_transition_args_begin(), gc_transition_args_end());
205   }
206 
207   /// Number of additional arguments excluding those intended
208   /// for garbage collection.
getNumTotalVMSArgs()209   int getNumTotalVMSArgs() const {
210     const Value *NumVMSArgs = *gc_transition_args_end();
211     return cast<ConstantInt>(NumVMSArgs)->getZExtValue();
212   }
213 
vm_state_begin()214   typename CallSiteTy::arg_iterator vm_state_begin() const {
215     auto I = gc_transition_args_end() + 1;
216     assert((getCallSite().arg_end() - I) >= 0);
217     return I;
218   }
vm_state_end()219   typename CallSiteTy::arg_iterator vm_state_end() const {
220     auto I = vm_state_begin() + getNumTotalVMSArgs();
221     assert((getCallSite().arg_end() - I) >= 0);
222     return I;
223   }
224 
225   /// range adapter for vm state arguments
vm_state_args()226   iterator_range<arg_iterator> vm_state_args() const {
227     return make_range(vm_state_begin(), vm_state_end());
228   }
229 
gc_args_begin()230   typename CallSiteTy::arg_iterator gc_args_begin() const {
231     return vm_state_end();
232   }
gc_args_end()233   typename CallSiteTy::arg_iterator gc_args_end() const {
234     return getCallSite().arg_end();
235   }
236 
gcArgsStartIdx()237   unsigned gcArgsStartIdx() const {
238     return gc_args_begin() - getInstruction()->op_begin();
239   }
240 
241   /// range adapter for gc arguments
gc_args()242   iterator_range<arg_iterator> gc_args() const {
243     return make_range(gc_args_begin(), gc_args_end());
244   }
245 
246   /// Get list of all gc reloactes linked to this statepoint
247   /// May contain several relocations for the same base/derived pair.
248   /// For example this could happen due to relocations on unwinding
249   /// path of invoke.
250   std::vector<GCRelocateOperands> getRelocates() const;
251 
252   /// Get the experimental_gc_result call tied to this statepoint.  Can be
253   /// nullptr if there isn't a gc_result tied to this statepoint.  Guaranteed to
254   /// be a CallInst if non-null.
getGCResult()255   InstructionTy *getGCResult() const {
256     for (auto *U : getInstruction()->users())
257       if (isGCResult(U))
258         return cast<CallInst>(U);
259 
260     return nullptr;
261   }
262 
263 #ifndef NDEBUG
264   /// Asserts if this statepoint is malformed.  Common cases for failure
265   /// include incorrect length prefixes for variable length sections or
266   /// illegal values for parameters.
verify()267   void verify() {
268     assert(getNumCallArgs() >= 0 &&
269            "number of arguments to actually callee can't be negative");
270 
271     // The internal asserts in the iterator accessors do the rest.
272     (void)arg_begin();
273     (void)arg_end();
274     (void)gc_transition_args_begin();
275     (void)gc_transition_args_end();
276     (void)vm_state_begin();
277     (void)vm_state_end();
278     (void)gc_args_begin();
279     (void)gc_args_end();
280   }
281 #endif
282 };
283 
284 /// A specialization of it's base class for read only access
285 /// to a gc.statepoint.
286 class ImmutableStatepoint
287     : public StatepointBase<const Function, const Instruction, const Value,
288                             ImmutableCallSite> {
289   typedef StatepointBase<const Function, const Instruction, const Value,
290                          ImmutableCallSite> Base;
291 
292 public:
ImmutableStatepoint(const Instruction * I)293   explicit ImmutableStatepoint(const Instruction *I) : Base(I) {}
ImmutableStatepoint(ImmutableCallSite CS)294   explicit ImmutableStatepoint(ImmutableCallSite CS) : Base(CS) {}
295 };
296 
297 /// A specialization of it's base class for read-write access
298 /// to a gc.statepoint.
299 class Statepoint
300     : public StatepointBase<Function, Instruction, Value, CallSite> {
301   typedef StatepointBase<Function, Instruction, Value, CallSite> Base;
302 
303 public:
Statepoint(Instruction * I)304   explicit Statepoint(Instruction *I) : Base(I) {}
Statepoint(CallSite CS)305   explicit Statepoint(CallSite CS) : Base(CS) {}
306 };
307 
308 /// Wraps a call to a gc.relocate and provides access to it's operands.
309 /// TODO: This should likely be refactored to resememble the wrappers in
310 /// InstrinsicInst.h.
311 class GCRelocateOperands {
312   ImmutableCallSite RelocateCS;
313 
314 public:
GCRelocateOperands(const User * U)315   GCRelocateOperands(const User *U) : RelocateCS(U) { assert(isGCRelocate(U)); }
GCRelocateOperands(const Instruction * inst)316   GCRelocateOperands(const Instruction *inst) : RelocateCS(inst) {
317     assert(isGCRelocate(inst));
318   }
GCRelocateOperands(CallSite CS)319   GCRelocateOperands(CallSite CS) : RelocateCS(CS) { assert(isGCRelocate(CS)); }
320 
321   /// Return true if this relocate is tied to the invoke statepoint.
322   /// This includes relocates which are on the unwinding path.
isTiedToInvoke()323   bool isTiedToInvoke() const {
324     const Value *Token = RelocateCS.getArgument(0);
325 
326     return isa<ExtractValueInst>(Token) || isa<InvokeInst>(Token);
327   }
328 
329   /// Get enclosed relocate intrinsic
getUnderlyingCallSite()330   ImmutableCallSite getUnderlyingCallSite() { return RelocateCS; }
331 
332   /// The statepoint with which this gc.relocate is associated.
getStatepoint()333   const Instruction *getStatepoint() {
334     const Value *Token = RelocateCS.getArgument(0);
335 
336     // This takes care both of relocates for call statepoints and relocates
337     // on normal path of invoke statepoint.
338     if (!isa<ExtractValueInst>(Token)) {
339       return cast<Instruction>(Token);
340     }
341 
342     // This relocate is on exceptional path of an invoke statepoint
343     const BasicBlock *InvokeBB =
344         cast<Instruction>(Token)->getParent()->getUniquePredecessor();
345 
346     assert(InvokeBB && "safepoints should have unique landingpads");
347     assert(InvokeBB->getTerminator() &&
348            "safepoint block should be well formed");
349     assert(isStatepoint(InvokeBB->getTerminator()));
350 
351     return InvokeBB->getTerminator();
352   }
353 
354   /// The index into the associate statepoint's argument list
355   /// which contains the base pointer of the pointer whose
356   /// relocation this gc.relocate describes.
getBasePtrIndex()357   unsigned getBasePtrIndex() {
358     return cast<ConstantInt>(RelocateCS.getArgument(1))->getZExtValue();
359   }
360 
361   /// The index into the associate statepoint's argument list which
362   /// contains the pointer whose relocation this gc.relocate describes.
getDerivedPtrIndex()363   unsigned getDerivedPtrIndex() {
364     return cast<ConstantInt>(RelocateCS.getArgument(2))->getZExtValue();
365   }
366 
getBasePtr()367   Value *getBasePtr() {
368     ImmutableCallSite CS(getStatepoint());
369     return *(CS.arg_begin() + getBasePtrIndex());
370   }
371 
getDerivedPtr()372   Value *getDerivedPtr() {
373     ImmutableCallSite CS(getStatepoint());
374     return *(CS.arg_begin() + getDerivedPtrIndex());
375   }
376 };
377 
378 template <typename FunTy, typename InstructionTy, typename ValueTy,
379           typename CallSiteTy>
380 std::vector<GCRelocateOperands>
getRelocates()381 StatepointBase<FunTy, InstructionTy, ValueTy, CallSiteTy>::getRelocates()
382     const {
383 
384   std::vector<GCRelocateOperands> Result;
385 
386   CallSiteTy StatepointCS = getCallSite();
387 
388   // Search for relocated pointers.  Note that working backwards from the
389   // gc_relocates ensures that we only get pairs which are actually relocated
390   // and used after the statepoint.
391   for (const User *U : getInstruction()->users())
392     if (isGCRelocate(U))
393       Result.push_back(GCRelocateOperands(U));
394 
395   if (!StatepointCS.isInvoke())
396     return Result;
397 
398   // We need to scan thorough exceptional relocations if it is invoke statepoint
399   LandingPadInst *LandingPad =
400       cast<InvokeInst>(getInstruction())->getLandingPadInst();
401 
402   // Search for extract value from landingpad instruction to which
403   // gc relocates will be attached
404   for (const User *LandingPadUser : LandingPad->users()) {
405     if (!isa<ExtractValueInst>(LandingPadUser))
406       continue;
407 
408     // gc relocates should be attached to this extract value
409     for (const User *U : LandingPadUser->users())
410       if (isGCRelocate(U))
411         Result.push_back(GCRelocateOperands(U));
412   }
413   return Result;
414 }
415 }
416 
417 #endif
418