Skip to content

Commit

Permalink
[HIP] change kernel stub name
Browse files Browse the repository at this point in the history
Add .stub to kernel stub function name so that it is different from kernel
name in device code. This is necessary to let debugger find correct symbol
for kernel.

Differential Revision: https://reviews.llvm.org/D58518

llvm-svn: 354948
  • Loading branch information
yxsamliu committed Feb 27, 2019
1 parent c4eff21 commit e739ac0
Show file tree
Hide file tree
Showing 3 changed files with 32 additions and 2 deletions.
1 change: 1 addition & 0 deletions clang/lib/CodeGen/CGCUDANV.cpp
Expand Up @@ -218,6 +218,7 @@ std::string CGNVCUDARuntime::getDeviceSideName(const Decl *D) {
void CGNVCUDARuntime::emitDeviceStub(CodeGenFunction &CGF,
FunctionArgList &Args) {
assert(getDeviceSideName(CGF.CurFuncDecl) == CGF.CurFn->getName() ||
getDeviceSideName(CGF.CurFuncDecl) + ".stub" == CGF.CurFn->getName() ||
CGF.CGM.getContext().getTargetInfo().getCXXABI() !=
CGF.CGM.getContext().getAuxTargetInfo()->getCXXABI());

Expand Down
13 changes: 11 additions & 2 deletions clang/lib/CodeGen/CodeGenModule.cpp
Expand Up @@ -1048,8 +1048,17 @@ StringRef CodeGenModule::getMangledName(GlobalDecl GD) {

// Keep the first result in the case of a mangling collision.
const auto *ND = cast<NamedDecl>(GD.getDecl());
auto Result =
Manglings.insert(std::make_pair(getMangledNameImpl(*this, GD, ND), GD));
std::string MangledName = getMangledNameImpl(*this, GD, ND);

// Postfix kernel stub names with .stub to differentiate them from kernel
// names in device binaries. This is to facilitate the debugger to find
// the correct symbols for kernels in the device binary.
if (auto *FD = dyn_cast<FunctionDecl>(GD.getDecl()))
if (getLangOpts().HIP && !getLangOpts().CUDAIsDevice &&
FD->hasAttr<CUDAGlobalAttr>())
MangledName = MangledName + ".stub";

auto Result = Manglings.insert(std::make_pair(MangledName, GD));
return MangledDeclNames[CanonicalGD] = Result.first->first();
}

Expand Down
20 changes: 20 additions & 0 deletions clang/test/CodeGenCUDA/kernel-stub-name.cu
@@ -0,0 +1,20 @@
// RUN: echo "GPU binary would be here" > %t

// RUN: %clang_cc1 -triple x86_64-linux-gnu -emit-llvm %s \
// RUN: -fcuda-include-gpubinary %t -o - -x hip\
// RUN: | FileCheck -allow-deprecated-dag-overlap %s --check-prefixes=CHECK

#include "Inputs/cuda.h"

template<class T>
__global__ void kernelfunc() {}

// CHECK-LABEL: define{{.*}}@_Z8hostfuncv()
// CHECK: call void @[[STUB:_Z10kernelfuncIiEvv.stub]]()
void hostfunc(void) { kernelfunc<int><<<1, 1>>>(); }

// CHECK: define{{.*}}@[[STUB]]
// CHECK: call{{.*}}@hipLaunchByPtr{{.*}}@[[STUB]]

// CHECK-LABEL: define{{.*}}@__hip_register_globals
// CHECK: call{{.*}}@__hipRegisterFunction{{.*}}@[[STUB]]

0 comments on commit e739ac0

Please sign in to comment.