Skip to content

Commit

Permalink
[CUDA] __global__ functions should always be visible externally.
Browse files Browse the repository at this point in the history
Adjust __global__ functions with DiscardableODR linkage to use
StrongODR linkage instead, so they are visible externally.

Differential Revision: http://reviews.llvm.org/D13067

llvm-svn: 248400
  • Loading branch information
Artem-B committed Sep 23, 2015
1 parent ade3abd commit 7b41f70
Show file tree
Hide file tree
Showing 3 changed files with 7 additions and 15 deletions.
12 changes: 6 additions & 6 deletions clang/lib/AST/ASTContext.cpp
Expand Up @@ -8284,22 +8284,22 @@ static GVALinkage basicGVALinkageForFunction(const ASTContext &Context,
return GVA_DiscardableODR;
}

static GVALinkage adjustGVALinkageForDLLAttribute(GVALinkage L, const Decl *D) {
static GVALinkage adjustGVALinkageForAttributes(GVALinkage L, const Decl *D) {
// See http://msdn.microsoft.com/en-us/library/xa0d9ste.aspx
// dllexport/dllimport on inline functions.
if (D->hasAttr<DLLImportAttr>()) {
if (L == GVA_DiscardableODR || L == GVA_StrongODR)
return GVA_AvailableExternally;
} else if (D->hasAttr<DLLExportAttr>()) {
} else if (D->hasAttr<DLLExportAttr>() || D->hasAttr<CUDAGlobalAttr>()) {
if (L == GVA_DiscardableODR)
return GVA_StrongODR;
}
return L;
}

GVALinkage ASTContext::GetGVALinkageForFunction(const FunctionDecl *FD) const {
return adjustGVALinkageForDLLAttribute(basicGVALinkageForFunction(*this, FD),
FD);
return adjustGVALinkageForAttributes(basicGVALinkageForFunction(*this, FD),
FD);
}

static GVALinkage basicGVALinkageForVariable(const ASTContext &Context,
Expand Down Expand Up @@ -8355,8 +8355,8 @@ static GVALinkage basicGVALinkageForVariable(const ASTContext &Context,
}

GVALinkage ASTContext::GetGVALinkageForVariable(const VarDecl *VD) {
return adjustGVALinkageForDLLAttribute(basicGVALinkageForVariable(*this, VD),
VD);
return adjustGVALinkageForAttributes(basicGVALinkageForVariable(*this, VD),
VD);
}

bool ASTContext::DeclMustBeEmitted(const Decl *D) {
Expand Down
3 changes: 0 additions & 3 deletions clang/lib/Sema/SemaDeclAttr.cpp
Expand Up @@ -3351,9 +3351,6 @@ static void handleGlobalAttr(Sema &S, Decl *D, const AttributeList &Attr) {
CUDAGlobalAttr(Attr.getRange(), S.Context,
Attr.getAttributeSpellingListIndex()));

// Add implicit attribute((used)) so we don't eliminate kernels
// because there is nothing referencing them on device side.
D->addAttr(UsedAttr::CreateImplicit(S.Context));
}

static void handleGNUInlineAttr(Sema &S, Decl *D, const AttributeList &Attr) {
Expand Down
7 changes: 1 addition & 6 deletions clang/test/CodeGenCUDA/ptx-kernels.cu
Expand Up @@ -6,11 +6,6 @@

#include "Inputs/cuda.h"

// Make sure that all __global__ functions are added to @llvm.used
// CHECK: @llvm.used = appending global
// CHECK-SAME: @global_function
// CHECK-SAME: @_Z16templated_kernelIiEvT_

// CHECK-LABEL: define void @device_function
extern "C"
__device__ void device_function() {}
Expand All @@ -24,7 +19,7 @@ __global__ void global_function() {

// Make sure host-instantiated kernels are preserved on device side.
template <typename T> __global__ void templated_kernel(T param) {}
// CHECK-LABEL: define linkonce_odr void @_Z16templated_kernelIiEvT_
// CHECK-LABEL: define weak_odr void @_Z16templated_kernelIiEvT_
void host_function() { templated_kernel<<<0,0>>>(0); }

// CHECK: !{{[0-9]+}} = !{void ()* @global_function, !"kernel", i32 1}
Expand Down

0 comments on commit 7b41f70

Please sign in to comment.