Skip to content

Commit

Permalink
[AMDGPU] Add ds_fadd, ds_fmin, ds_fmax builtins functions
Browse files Browse the repository at this point in the history
Reviewed by arsenm

Differential Revision: https://reviews.llvm.org/D42578

llvm-svn: 323890
  • Loading branch information
dfukalov committed Jan 31, 2018
1 parent 82a8339 commit e72cde5
Show file tree
Hide file tree
Showing 2 changed files with 23 additions and 0 deletions.
3 changes: 3 additions & 0 deletions clang/include/clang/Basic/BuiltinsAMDGPU.def
Expand Up @@ -93,6 +93,9 @@ BUILTIN(__builtin_amdgcn_ds_bpermute, "iii", "nc")
BUILTIN(__builtin_amdgcn_readfirstlane, "ii", "nc")
BUILTIN(__builtin_amdgcn_readlane, "iii", "nc")
BUILTIN(__builtin_amdgcn_fmed3f, "ffff", "nc")
BUILTIN(__builtin_amdgcn_ds_fadd, "ff*3fiib", "n")
BUILTIN(__builtin_amdgcn_ds_fmin, "ff*3fiib", "n")
BUILTIN(__builtin_amdgcn_ds_fmax, "ff*3fiib", "n")

//===----------------------------------------------------------------------===//
// VI+ only builtins.
Expand Down
20 changes: 20 additions & 0 deletions clang/test/CodeGenOpenCL/builtins-amdgcn-vi.cl
Expand Up @@ -89,3 +89,23 @@ void test_mov_dpp(global int* out, int src)
*out = __builtin_amdgcn_mov_dpp(src, 0, 0, 0, false);
}

// CHECK-LABEL: @test_ds_fadd
// CHECK: call float @llvm.amdgcn.ds.fadd(float addrspace(3)* %out, float %src, i32 0, i32 0, i1 false)
void test_ds_fadd(local float *out, float src)
{
*out = __builtin_amdgcn_ds_fadd(out, src, 0, 0, false);
}

// CHECK-LABEL: @test_ds_fmin
// CHECK: call float @llvm.amdgcn.ds.fmin(float addrspace(3)* %out, float %src, i32 0, i32 0, i1 false)
void test_ds_fmin(local float *out, float src)
{
*out = __builtin_amdgcn_ds_fmin(out, src, 0, 0, false);
}

// CHECK-LABEL: @test_ds_fmax
// CHECK: call float @llvm.amdgcn.ds.fmax(float addrspace(3)* %out, float %src, i32 0, i32 0, i1 false)
void test_ds_fmax(local float *out, float src)
{
*out = __builtin_amdgcn_ds_fmax(out, src, 0, 0, false);
}

0 comments on commit e72cde5

Please sign in to comment.