1 //===--- SemaCUDA.cpp - Semantic Analysis for CUDA constructs -------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 /// \file
10 /// \brief This file implements semantic analysis for CUDA constructs.
11 ///
12 //===----------------------------------------------------------------------===//
13 
14 #include "clang/Sema/Sema.h"
15 #include "clang/AST/ASTContext.h"
16 #include "clang/AST/Decl.h"
17 #include "clang/Lex/Preprocessor.h"
18 #include "clang/Sema/SemaDiagnostic.h"
19 #include "llvm/ADT/Optional.h"
20 #include "llvm/ADT/SmallVector.h"
21 using namespace clang;
22 
ActOnCUDAExecConfigExpr(Scope * S,SourceLocation LLLLoc,MultiExprArg ExecConfig,SourceLocation GGGLoc)23 ExprResult Sema::ActOnCUDAExecConfigExpr(Scope *S, SourceLocation LLLLoc,
24                                          MultiExprArg ExecConfig,
25                                          SourceLocation GGGLoc) {
26   FunctionDecl *ConfigDecl = Context.getcudaConfigureCallDecl();
27   if (!ConfigDecl)
28     return ExprError(Diag(LLLLoc, diag::err_undeclared_var_use)
29                      << "cudaConfigureCall");
30   QualType ConfigQTy = ConfigDecl->getType();
31 
32   DeclRefExpr *ConfigDR = new (Context)
33       DeclRefExpr(ConfigDecl, false, ConfigQTy, VK_LValue, LLLLoc);
34   MarkFunctionReferenced(LLLLoc, ConfigDecl);
35 
36   return ActOnCallExpr(S, ConfigDR, LLLLoc, ExecConfig, GGGLoc, nullptr,
37                        /*IsExecConfig=*/true);
38 }
39 
40 /// IdentifyCUDATarget - Determine the CUDA compilation target for this function
IdentifyCUDATarget(const FunctionDecl * D)41 Sema::CUDAFunctionTarget Sema::IdentifyCUDATarget(const FunctionDecl *D) {
42   if (D->hasAttr<CUDAInvalidTargetAttr>())
43     return CFT_InvalidTarget;
44 
45   if (D->hasAttr<CUDAGlobalAttr>())
46     return CFT_Global;
47 
48   if (D->hasAttr<CUDADeviceAttr>()) {
49     if (D->hasAttr<CUDAHostAttr>())
50       return CFT_HostDevice;
51     return CFT_Device;
52   } else if (D->hasAttr<CUDAHostAttr>()) {
53     return CFT_Host;
54   } else if (D->isImplicit()) {
55     // Some implicit declarations (like intrinsic functions) are not marked.
56     // Set the most lenient target on them for maximal flexibility.
57     return CFT_HostDevice;
58   }
59 
60   return CFT_Host;
61 }
62 
CheckCUDATarget(const FunctionDecl * Caller,const FunctionDecl * Callee)63 bool Sema::CheckCUDATarget(const FunctionDecl *Caller,
64                            const FunctionDecl *Callee) {
65   // The CUDADisableTargetCallChecks short-circuits this check: we assume all
66   // cross-target calls are valid.
67   if (getLangOpts().CUDADisableTargetCallChecks)
68     return false;
69 
70   CUDAFunctionTarget CallerTarget = IdentifyCUDATarget(Caller),
71                      CalleeTarget = IdentifyCUDATarget(Callee);
72 
73   // If one of the targets is invalid, the check always fails, no matter what
74   // the other target is.
75   if (CallerTarget == CFT_InvalidTarget || CalleeTarget == CFT_InvalidTarget)
76     return true;
77 
78   // CUDA B.1.1 "The __device__ qualifier declares a function that is [...]
79   // Callable from the device only."
80   if (CallerTarget == CFT_Host && CalleeTarget == CFT_Device)
81     return true;
82 
83   // CUDA B.1.2 "The __global__ qualifier declares a function that is [...]
84   // Callable from the host only."
85   // CUDA B.1.3 "The __host__ qualifier declares a function that is [...]
86   // Callable from the host only."
87   if ((CallerTarget == CFT_Device || CallerTarget == CFT_Global) &&
88       (CalleeTarget == CFT_Host || CalleeTarget == CFT_Global))
89     return true;
90 
91   // CUDA B.1.3 "The __device__ and __host__ qualifiers can be used together
92   // however, in which case the function is compiled for both the host and the
93   // device. The __CUDA_ARCH__ macro [...] can be used to differentiate code
94   // paths between host and device."
95   if (CallerTarget == CFT_HostDevice && CalleeTarget != CFT_HostDevice) {
96     // If the caller is implicit then the check always passes.
97     if (Caller->isImplicit()) return false;
98 
99     bool InDeviceMode = getLangOpts().CUDAIsDevice;
100     if (!InDeviceMode && CalleeTarget != CFT_Host)
101         return true;
102     if (InDeviceMode && CalleeTarget != CFT_Device) {
103       // Allow host device functions to call host functions if explicitly
104       // requested.
105       if (CalleeTarget == CFT_Host &&
106           getLangOpts().CUDAAllowHostCallsFromHostDevice) {
107         Diag(Caller->getLocation(),
108              diag::warn_host_calls_from_host_device)
109             << Callee->getNameAsString() << Caller->getNameAsString();
110         return false;
111       }
112 
113       return true;
114     }
115   }
116 
117   return false;
118 }
119 
120 /// When an implicitly-declared special member has to invoke more than one
121 /// base/field special member, conflicts may occur in the targets of these
122 /// members. For example, if one base's member __host__ and another's is
123 /// __device__, it's a conflict.
124 /// This function figures out if the given targets \param Target1 and
125 /// \param Target2 conflict, and if they do not it fills in
126 /// \param ResolvedTarget with a target that resolves for both calls.
127 /// \return true if there's a conflict, false otherwise.
128 static bool
resolveCalleeCUDATargetConflict(Sema::CUDAFunctionTarget Target1,Sema::CUDAFunctionTarget Target2,Sema::CUDAFunctionTarget * ResolvedTarget)129 resolveCalleeCUDATargetConflict(Sema::CUDAFunctionTarget Target1,
130                                 Sema::CUDAFunctionTarget Target2,
131                                 Sema::CUDAFunctionTarget *ResolvedTarget) {
132   if (Target1 == Sema::CFT_Global && Target2 == Sema::CFT_Global) {
133     // TODO: this shouldn't happen, really. Methods cannot be marked __global__.
134     // Clang should detect this earlier and produce an error. Then this
135     // condition can be changed to an assertion.
136     return true;
137   }
138 
139   if (Target1 == Sema::CFT_HostDevice) {
140     *ResolvedTarget = Target2;
141   } else if (Target2 == Sema::CFT_HostDevice) {
142     *ResolvedTarget = Target1;
143   } else if (Target1 != Target2) {
144     return true;
145   } else {
146     *ResolvedTarget = Target1;
147   }
148 
149   return false;
150 }
151 
inferCUDATargetForImplicitSpecialMember(CXXRecordDecl * ClassDecl,CXXSpecialMember CSM,CXXMethodDecl * MemberDecl,bool ConstRHS,bool Diagnose)152 bool Sema::inferCUDATargetForImplicitSpecialMember(CXXRecordDecl *ClassDecl,
153                                                    CXXSpecialMember CSM,
154                                                    CXXMethodDecl *MemberDecl,
155                                                    bool ConstRHS,
156                                                    bool Diagnose) {
157   llvm::Optional<CUDAFunctionTarget> InferredTarget;
158 
159   // We're going to invoke special member lookup; mark that these special
160   // members are called from this one, and not from its caller.
161   ContextRAII MethodContext(*this, MemberDecl);
162 
163   // Look for special members in base classes that should be invoked from here.
164   // Infer the target of this member base on the ones it should call.
165   // Skip direct and indirect virtual bases for abstract classes.
166   llvm::SmallVector<const CXXBaseSpecifier *, 16> Bases;
167   for (const auto &B : ClassDecl->bases()) {
168     if (!B.isVirtual()) {
169       Bases.push_back(&B);
170     }
171   }
172 
173   if (!ClassDecl->isAbstract()) {
174     for (const auto &VB : ClassDecl->vbases()) {
175       Bases.push_back(&VB);
176     }
177   }
178 
179   for (const auto *B : Bases) {
180     const RecordType *BaseType = B->getType()->getAs<RecordType>();
181     if (!BaseType) {
182       continue;
183     }
184 
185     CXXRecordDecl *BaseClassDecl = cast<CXXRecordDecl>(BaseType->getDecl());
186     Sema::SpecialMemberOverloadResult *SMOR =
187         LookupSpecialMember(BaseClassDecl, CSM,
188                             /* ConstArg */ ConstRHS,
189                             /* VolatileArg */ false,
190                             /* RValueThis */ false,
191                             /* ConstThis */ false,
192                             /* VolatileThis */ false);
193 
194     if (!SMOR || !SMOR->getMethod()) {
195       continue;
196     }
197 
198     CUDAFunctionTarget BaseMethodTarget = IdentifyCUDATarget(SMOR->getMethod());
199     if (!InferredTarget.hasValue()) {
200       InferredTarget = BaseMethodTarget;
201     } else {
202       bool ResolutionError = resolveCalleeCUDATargetConflict(
203           InferredTarget.getValue(), BaseMethodTarget,
204           InferredTarget.getPointer());
205       if (ResolutionError) {
206         if (Diagnose) {
207           Diag(ClassDecl->getLocation(),
208                diag::note_implicit_member_target_infer_collision)
209               << (unsigned)CSM << InferredTarget.getValue() << BaseMethodTarget;
210         }
211         MemberDecl->addAttr(CUDAInvalidTargetAttr::CreateImplicit(Context));
212         return true;
213       }
214     }
215   }
216 
217   // Same as for bases, but now for special members of fields.
218   for (const auto *F : ClassDecl->fields()) {
219     if (F->isInvalidDecl()) {
220       continue;
221     }
222 
223     const RecordType *FieldType =
224         Context.getBaseElementType(F->getType())->getAs<RecordType>();
225     if (!FieldType) {
226       continue;
227     }
228 
229     CXXRecordDecl *FieldRecDecl = cast<CXXRecordDecl>(FieldType->getDecl());
230     Sema::SpecialMemberOverloadResult *SMOR =
231         LookupSpecialMember(FieldRecDecl, CSM,
232                             /* ConstArg */ ConstRHS && !F->isMutable(),
233                             /* VolatileArg */ false,
234                             /* RValueThis */ false,
235                             /* ConstThis */ false,
236                             /* VolatileThis */ false);
237 
238     if (!SMOR || !SMOR->getMethod()) {
239       continue;
240     }
241 
242     CUDAFunctionTarget FieldMethodTarget =
243         IdentifyCUDATarget(SMOR->getMethod());
244     if (!InferredTarget.hasValue()) {
245       InferredTarget = FieldMethodTarget;
246     } else {
247       bool ResolutionError = resolveCalleeCUDATargetConflict(
248           InferredTarget.getValue(), FieldMethodTarget,
249           InferredTarget.getPointer());
250       if (ResolutionError) {
251         if (Diagnose) {
252           Diag(ClassDecl->getLocation(),
253                diag::note_implicit_member_target_infer_collision)
254               << (unsigned)CSM << InferredTarget.getValue()
255               << FieldMethodTarget;
256         }
257         MemberDecl->addAttr(CUDAInvalidTargetAttr::CreateImplicit(Context));
258         return true;
259       }
260     }
261   }
262 
263   if (InferredTarget.hasValue()) {
264     if (InferredTarget.getValue() == CFT_Device) {
265       MemberDecl->addAttr(CUDADeviceAttr::CreateImplicit(Context));
266     } else if (InferredTarget.getValue() == CFT_Host) {
267       MemberDecl->addAttr(CUDAHostAttr::CreateImplicit(Context));
268     } else {
269       MemberDecl->addAttr(CUDADeviceAttr::CreateImplicit(Context));
270       MemberDecl->addAttr(CUDAHostAttr::CreateImplicit(Context));
271     }
272   } else {
273     // If no target was inferred, mark this member as __host__ __device__;
274     // it's the least restrictive option that can be invoked from any target.
275     MemberDecl->addAttr(CUDADeviceAttr::CreateImplicit(Context));
276     MemberDecl->addAttr(CUDAHostAttr::CreateImplicit(Context));
277   }
278 
279   return false;
280 }
281