From 8310438f26309f7817aa96ed81853ed5f9a69907 Mon Sep 17 00:00:00 2001 From: Tom Stellard Date: Sat, 4 Jun 2016 03:43:05 +0000 Subject: [PATCH] Merging r268259: ------------------------------------------------------------------------ r268259 | nhaehnle | 2016-05-02 10:37:01 -0700 (Mon, 02 May 2016) | 14 lines AMDGPU: llvm.SI.fs.constant is a source of divergence Summary: This intrinsic is used to get flat-shaded fragment shader inputs. Those are uniform across a primitive, but a fragment shader wave may process pixels from multiple primitives (as indicated by the prim_mask), and so that's where divergence can arise. Reviewers: arsenm, tstellarAMD Subscribers: arsenm, llvm-commits Differential Revision: http://reviews.llvm.org/D19747 ------------------------------------------------------------------------ llvm-svn: 271769 --- .../AMDGPU/AMDGPUTargetTransformInfo.cpp | 1 + .../AMDGPU/interp-intrinsics.ll | 23 +++++++++++++++++++ 2 files changed, 24 insertions(+) create mode 100644 llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll diff --git a/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp b/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp index 54a003d6a9cf9..5d347722363a0 100644 --- a/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp +++ b/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp @@ -131,6 +131,7 @@ static bool isIntrinsicSourceOfDivergence(const TargetIntrinsicInfo *TII, return false; case AMDGPUIntrinsic::SI_tid: case AMDGPUIntrinsic::SI_fs_interp: + case AMDGPUIntrinsic::SI_fs_constant: return true; } } diff --git a/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll b/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll new file mode 100644 index 0000000000000..902cf0eed40b0 --- /dev/null +++ b/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll @@ -0,0 +1,23 @@ +; RUN: opt -mtriple amdgcn--- -analyze -divergence %s | FileCheck %s + +; CHECK-LABEL: 'fs_interp' +; CHECK: DIVERGENT: %v = call float @llvm.SI.fs.interp( +define void @fs_interp(i32 inreg %prim_mask, <2 x i32> %interp_param) #1 { + %v = call float @llvm.SI.fs.interp(i32 0, i32 0, i32 %prim_mask, <2 x i32> %interp_param) + store volatile float %v, float addrspace(1)* undef + ret void +} + +; CHECK-LABEL: 'fs_constant' +; CHECK: DIVERGENT: %v = call float @llvm.SI.fs.constant( +define void @fs_constant(i32 inreg %prim_mask, <2 x i32> %interp_param) #1 { + %v = call float @llvm.SI.fs.constant(i32 0, i32 0, i32 %prim_mask) + store volatile float %v, float addrspace(1)* undef + ret void +} + +declare float @llvm.SI.fs.interp(i32, i32, i32, <2 x i32>) #0 +declare float @llvm.SI.fs.constant(i32, i32, i32) #0 + +attributes #0 = { nounwind readnone } +attributes #1 = { "ShaderType"="1"}