Skip to content

Commit

Permalink
[OpenCL] AMDGCN target will generate images in constant address space
Browse files Browse the repository at this point in the history
Allows AMDGCN target to generate images (such as %opencl.image2d_t) in constant address space.
Images will still be generated in global address space by default.

Added tests to existing opencl-types.cl in test\CodeGenOpenCL.

Patch by Aaron En Ye Shi.

Differential Revision: https://reviews.llvm.org/D22523

llvm-svn: 276161
  • Loading branch information
yxsamliu committed Jul 20, 2016
1 parent d3f047a commit 37ceede
Show file tree
Hide file tree
Showing 4 changed files with 39 additions and 16 deletions.
3 changes: 2 additions & 1 deletion clang/lib/CodeGen/CGOpenCLRuntime.cpp
Expand Up @@ -15,6 +15,7 @@

#include "CGOpenCLRuntime.h"
#include "CodeGenFunction.h"
#include "TargetInfo.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/GlobalValue.h"
#include <assert.h>
Expand All @@ -35,7 +36,7 @@ llvm::Type *CGOpenCLRuntime::convertOpenCLSpecificType(const Type *T) {

llvm::LLVMContext& Ctx = CGM.getLLVMContext();
uint32_t ImgAddrSpc =
CGM.getContext().getTargetAddressSpace(LangAS::opencl_global);
CGM.getTargetCodeGenInfo().getOpenCLImageAddrSpace(CGM);
switch (cast<BuiltinType>(T)->getKind()) {
default:
llvm_unreachable("Unexpected opencl builtin type!");
Expand Down
10 changes: 10 additions & 0 deletions clang/lib/CodeGen/TargetInfo.cpp
Expand Up @@ -375,6 +375,11 @@ TargetCodeGenInfo::getDependentLibraryOption(llvm::StringRef Lib,
unsigned TargetCodeGenInfo::getOpenCLKernelCallingConv() const {
return llvm::CallingConv::C;
}

unsigned TargetCodeGenInfo::getOpenCLImageAddrSpace(CodeGen::CodeGenModule &CGM) const {
return CGM.getContext().getTargetAddressSpace(LangAS::opencl_global);
}

static bool isEmptyRecord(ASTContext &Context, QualType T, bool AllowArrays);

/// isEmptyField - Return true iff a the field is "empty", that is it
Expand Down Expand Up @@ -6832,6 +6837,7 @@ class AMDGPUTargetCodeGenInfo : public TargetCodeGenInfo {
void setTargetAttributes(const Decl *D, llvm::GlobalValue *GV,
CodeGen::CodeGenModule &M) const override;
unsigned getOpenCLKernelCallingConv() const override;
unsigned getOpenCLImageAddrSpace(CodeGen::CodeGenModule &CGM) const override;
};

}
Expand Down Expand Up @@ -6868,6 +6874,10 @@ unsigned AMDGPUTargetCodeGenInfo::getOpenCLKernelCallingConv() const {
return llvm::CallingConv::AMDGPU_KERNEL;
}

unsigned AMDGPUTargetCodeGenInfo::getOpenCLImageAddrSpace(CodeGen::CodeGenModule &CGM) const {
return CGM.getContext().getTargetAddressSpace(LangAS::opencl_constant);
}

//===----------------------------------------------------------------------===//
// SPARC v8 ABI Implementation.
// Based on the SPARC Compliance Definition version 2.4.1.
Expand Down
3 changes: 3 additions & 0 deletions clang/lib/CodeGen/TargetInfo.h
Expand Up @@ -220,6 +220,9 @@ class TargetCodeGenInfo {

/// Get LLVM calling convention for OpenCL kernel.
virtual unsigned getOpenCLKernelCallingConv() const;

/// Get LLVM Image Address Space for OpenCL kernel.
virtual unsigned getOpenCLImageAddrSpace(CodeGen::CodeGenModule &CGM) const;
};

} // namespace CodeGen
Expand Down
39 changes: 24 additions & 15 deletions clang/test/CodeGenOpenCL/opencl_types.cl
@@ -1,40 +1,49 @@
// RUN: %clang_cc1 %s -emit-llvm -o - -O0 | FileCheck %s
// RUN: %clang_cc1 %s -triple "spir-unknown-unknown" -emit-llvm -o - -O0 | FileCheck %s --check-prefix=CHECK-SPIR
// RUN: %clang_cc1 %s -triple "amdgcn--amdhsa" -emit-llvm -o - -O0 | FileCheck %s --check-prefix=CHECK-AMDGCN

constant sampler_t glb_smp = 7;
// CHECK: constant i32 7
// CHECK-SPIR: constant i32 7
// CHECK-AMDGCN: addrspace(2) constant i32 7

void fnc1(image1d_t img) {}
// CHECK: @fnc1(%opencl.image1d_ro_t*
// CHECK-SPIR: @fnc1(%opencl.image1d_ro_t addrspace(1)*
// CHECK-AMDGCN: @fnc1(%opencl.image1d_ro_t addrspace(2)*

void fnc1arr(image1d_array_t img) {}
// CHECK: @fnc1arr(%opencl.image1d_array_ro_t*
// CHECK-SPIR: @fnc1arr(%opencl.image1d_array_ro_t addrspace(1)*
// CHECK-AMDGCN: @fnc1arr(%opencl.image1d_array_ro_t addrspace(2)*

void fnc1buff(image1d_buffer_t img) {}
// CHECK: @fnc1buff(%opencl.image1d_buffer_ro_t*
// CHECK-SPIR: @fnc1buff(%opencl.image1d_buffer_ro_t addrspace(1)*
// CHECK-AMDGCN: @fnc1buff(%opencl.image1d_buffer_ro_t addrspace(2)*

void fnc2(image2d_t img) {}
// CHECK: @fnc2(%opencl.image2d_ro_t*
// CHECK-SPIR: @fnc2(%opencl.image2d_ro_t addrspace(1)*
// CHECK-AMDGCN: @fnc2(%opencl.image2d_ro_t addrspace(2)*

void fnc2arr(image2d_array_t img) {}
// CHECK: @fnc2arr(%opencl.image2d_array_ro_t*
// CHECK-SPIR: @fnc2arr(%opencl.image2d_array_ro_t addrspace(1)*
// CHECK-AMDGCN: @fnc2arr(%opencl.image2d_array_ro_t addrspace(2)*

void fnc3(image3d_t img) {}
// CHECK: @fnc3(%opencl.image3d_ro_t*
// CHECK-SPIR: @fnc3(%opencl.image3d_ro_t addrspace(1)*
// CHECK-AMDGCN: @fnc3(%opencl.image3d_ro_t addrspace(2)*

void fnc4smp(sampler_t s) {}
// CHECK-LABEL: define {{.*}}void @fnc4smp(i32
// CHECK-SPIR-LABEL: define {{.*}}void @fnc4smp(i32

kernel void foo(image1d_t img) {
sampler_t smp = 5;
// CHECK: alloca i32
// CHECK-SPIR: alloca i32
event_t evt;
// CHECK: alloca %opencl.event_t*
// CHECK: store i32 5,
// CHECK-SPIR: alloca %opencl.event_t*
// CHECK-SPIR: store i32 5,
fnc4smp(smp);
// CHECK: call {{.*}}void @fnc4smp(i32
// CHECK-SPIR: call {{.*}}void @fnc4smp(i32
fnc4smp(glb_smp);
// CHECK: call {{.*}}void @fnc4smp(i32
// CHECK-SPIR: call {{.*}}void @fnc4smp(i32
}

void __attribute__((overloadable)) bad1(image1d_t b, image2d_t c, image2d_t d) {}
// CHECK-LABEL: @{{_Z4bad114ocl_image1d_ro14ocl_image2d_roS0_|"\\01\?bad1@@\$\$J0YAXPAUocl_image1d_ro@@PAUocl_image2d_ro@@1@Z"}}
// CHECK-SPIR-LABEL: @{{_Z4bad114ocl_image1d_ro14ocl_image2d_roS0_|"\\01\?bad1@@\$\$J0YAXPAUocl_image1d_ro@@PAUocl_image2d_ro@@1@Z"}}
// CHECK-AMDGCN-LABEL: @{{_Z4bad114ocl_image1d_ro14ocl_image2d_roS0_|"\\01\?bad1@@\$\$J0YAXPAUocl_image1d_ro@@PAUocl_image2d_ro@@1@Z"}}(%opencl.image1d_ro_t addrspace(2)*{{.*}}%opencl.image2d_ro_t addrspace(2)*{{.*}}%opencl.image2d_ro_t addrspace(2)*{{.*}})

0 comments on commit 37ceede

Please sign in to comment.