Skip to content

Commit

Permalink
AMDGPU/SI: Use amdgpu_kernel calling convention for OpenCL kernels.
Browse files Browse the repository at this point in the history
Reviewers: tstellarAMD, arsenm

Subscribers: cfe-commits

Differential Revision: http://reviews.llvm.org/D19918

llvm-svn: 268718
  • Loading branch information
Nikolay Haustov authored and Nikolay Haustov committed May 6, 2016
1 parent 1f7732a commit 4961ea8
Show file tree
Hide file tree
Showing 3 changed files with 24 additions and 4 deletions.
8 changes: 8 additions & 0 deletions clang/lib/CodeGen/TargetInfo.cpp
Expand Up @@ -6826,6 +6826,14 @@ void AMDGPUTargetCodeGenInfo::setTargetAttributes(
if (!FD)
return;

if (M.getLangOpts().OpenCL) {
if (FD->hasAttr<OpenCLKernelAttr>()) {
// Set amdgpu_kernel calling convention for OpenCL kernels.
llvm::Function *Fn = cast<llvm::Function>(GV);
Fn->setCallingConv(llvm::CallingConv::AMDGPU_KERNEL);
}
}

if (const auto Attr = FD->getAttr<AMDGPUNumVGPRAttr>()) {
llvm::Function *F = cast<llvm::Function>(GV);
uint32_t NumVGPR = Attr->getNumVGPR();
Expand Down
12 changes: 12 additions & 0 deletions clang/test/CodeGenOpenCL/amdgpu-calling-conv.cl
@@ -0,0 +1,12 @@
// REQUIRES: amdgpu-registered-target
// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -S -emit-llvm -o - %s | FileCheck %s

// CHECK: define amdgpu_kernel void @calling_conv_amdgpu_kernel()
// Empty OpenCL kernel. The FileCheck directive directly above requires its
// IR definition to carry the amdgpu_kernel calling convention.
kernel void calling_conv_amdgpu_kernel() {}

// CHECK: define void @calling_conv_none()
// Plain (non-kernel) function. The FileCheck directive directly above requires
// an IR definition that carries no calling-convention keyword.
void calling_conv_none() {}
8 changes: 4 additions & 4 deletions clang/test/CodeGenOpenCL/amdgpu-num-gpr-attr.cl
Expand Up @@ -5,23 +5,23 @@

// Kernel annotated only with amdgpu_num_vgpr(64). The FileCheck directive in
// the body captures the function's attribute group as ATTR_VGPR64.
// NOTE(review): the two directives in the body look like the removed and added
// sides of a diff hunk whose +/- markers were lost; only the amdgpu_kernel form
// agrees with the calling-convention change in this commit -- confirm which
// one is live before relying on this text as a test file.
__attribute__((amdgpu_num_vgpr(64))) // expected-no-diagnostics
kernel void test_num_vgpr64() {
// CHECK: define void @test_num_vgpr64() [[ATTR_VGPR64:#[0-9]+]]
// CHECK: define amdgpu_kernel void @test_num_vgpr64() [[ATTR_VGPR64:#[0-9]+]]
}

// Kernel annotated only with amdgpu_num_sgpr(32). The FileCheck directive in
// the body captures the function's attribute group as ATTR_SGPR32.
// NOTE(review): the two directives in the body look like the removed and added
// sides of a diff hunk whose +/- markers were lost; only the amdgpu_kernel form
// agrees with the calling-convention change in this commit -- confirm which
// one is live before relying on this text as a test file.
__attribute__((amdgpu_num_sgpr(32))) // expected-no-diagnostics
kernel void test_num_sgpr32() {
// CHECK: define void @test_num_sgpr32() [[ATTR_SGPR32:#[0-9]+]]
// CHECK: define amdgpu_kernel void @test_num_sgpr32() [[ATTR_SGPR32:#[0-9]+]]
}

// Kernel annotated with both amdgpu_num_vgpr(64) and amdgpu_num_sgpr(32), in
// that order. The FileCheck directive in the body captures the function's
// attribute group as ATTR_VGPR64_SGPR32.
// NOTE(review): the two directives in the body look like the removed and added
// sides of a diff hunk whose +/- markers were lost; only the amdgpu_kernel form
// agrees with the calling-convention change in this commit -- confirm which
// one is live before relying on this text as a test file.
__attribute__((amdgpu_num_vgpr(64), amdgpu_num_sgpr(32))) // expected-no-diagnostics
kernel void test_num_vgpr64_sgpr32() {
// CHECK: define void @test_num_vgpr64_sgpr32() [[ATTR_VGPR64_SGPR32:#[0-9]+]]
// CHECK: define amdgpu_kernel void @test_num_vgpr64_sgpr32() [[ATTR_VGPR64_SGPR32:#[0-9]+]]

}

// Kernel annotated with amdgpu_num_sgpr(20) and amdgpu_num_vgpr(40), SGPR
// attribute listed first. The FileCheck directive in the body captures the
// function's attribute group as ATTR_SGPR20_VGPR40.
// NOTE(review): the two directives in the body look like the removed and added
// sides of a diff hunk whose +/- markers were lost; only the amdgpu_kernel form
// agrees with the calling-convention change in this commit -- confirm which
// one is live before relying on this text as a test file.
__attribute__((amdgpu_num_sgpr(20), amdgpu_num_vgpr(40))) // expected-no-diagnostics
kernel void test_num_sgpr20_vgpr40() {
// CHECK: define void @test_num_sgpr20_vgpr40() [[ATTR_SGPR20_VGPR40:#[0-9]+]]
// CHECK: define amdgpu_kernel void @test_num_sgpr20_vgpr40() [[ATTR_SGPR20_VGPR40:#[0-9]+]]
}

__attribute__((amdgpu_num_vgpr(0))) // expected-no-diagnostics
Expand Down

0 comments on commit 4961ea8

Please sign in to comment.