506 changes: 247 additions & 259 deletions llvm/test/CodeGen/AMDGPU/shift-i128.ll

Large diffs are not rendered by default.

19 changes: 6 additions & 13 deletions llvm/test/CodeGen/AMDGPU/sint_to_fp.f64.ll
Original file line number Diff line number Diff line change
Expand Up @@ -15,19 +15,12 @@ define amdgpu_kernel void @sint_to_fp_i32_to_f64(double addrspace(1)* %out, i32
; uses an SGPR (implicit vcc).

; GCN-LABEL: {{^}}sint_to_fp_i1_f64:
; VI-DAG: s_cmp_eq_u32
; VI-DAG: s_cselect_b32 s[[SSEL:[0-9]+]], 0xbff00000, 0
; VI-DAG: v_mov_b32_e32 v[[ZERO:[0-9]+]], 0{{$}}
; VI-DAG: v_mov_b32_e32 v[[SEL:[0-9]+]], s[[SSEL]]
; VI: flat_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, v[[[ZERO]]:[[SEL]]]
; VI: s_endpgm

; CI-DAG: s_cmp_eq_u32
; CI-DAG: s_cselect_b64 vcc, -1, 0
; CI-DAG: v_cndmask_b32_e32 v[[SEL:[0-9]+]], 0, v{{[0-9]+}}, vcc
; CI-DAG: v_mov_b32_e32 v[[ZERO:[0-9]+]], 0{{$}}
; CI: flat_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, v[[[ZERO]]:[[SEL]]]
; CI: s_endpgm
; GCN-DAG: s_cmp_eq_u32
; GCN-DAG: s_cselect_b32 s[[SSEL:[0-9]+]], 0xbff00000, 0
; GCN-DAG: v_mov_b32_e32 v[[ZERO:[0-9]+]], 0{{$}}
; GCN-DAG: v_mov_b32_e32 v[[SEL:[0-9]+]], s[[SSEL]]
; GCN: flat_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, v[[[ZERO]]:[[SEL]]]
; GCN: s_endpgm
define amdgpu_kernel void @sint_to_fp_i1_f64(double addrspace(1)* %out, i32 %in) {
%cmp = icmp eq i32 %in, 0
%fp = sitofp i1 %cmp to double
Expand Down
992 changes: 509 additions & 483 deletions llvm/test/CodeGen/AMDGPU/srem64.ll

Large diffs are not rendered by default.

4 changes: 1 addition & 3 deletions llvm/test/CodeGen/AMDGPU/trunc.ll
Original file line number Diff line number Diff line change
Expand Up @@ -96,9 +96,7 @@ define amdgpu_kernel void @sgpr_trunc_i32_to_i1(i32 addrspace(1)* %out, i32 %a)
; SI: s_load_dwordx2 s[[[SLO:[0-9]+]]:{{[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0x13
; VI: s_load_dwordx2 s[[[SLO:[0-9]+]]:{{[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0x4c
; GCN: s_bitcmp1_b32 s[[SLO]], 0
; SI: s_cselect_b64 s[[[VLO:[0-9]+]]:[[VHI:[0-9]+]]], -1, 0
; SI: v_cndmask_b32_e64 {{v[0-9]+}}, -12, 63, s[[[VLO]]:[[VHI]]]
; VI: s_cselect_b32 {{s[0-9]+}}, 63, -12
; GCN: s_cselect_b32 {{s[0-9]+}}, 63, -12
define amdgpu_kernel void @s_trunc_i64_to_i1(i32 addrspace(1)* %out, [8 x i32], i64 %x) {
%trunc = trunc i64 %x to i1
%sel = select i1 %trunc, i32 63, i32 -12
Expand Down
630 changes: 336 additions & 294 deletions llvm/test/CodeGen/AMDGPU/udiv.ll

Large diffs are not rendered by default.

391 changes: 191 additions & 200 deletions llvm/test/CodeGen/AMDGPU/udiv64.ll

Large diffs are not rendered by default.

301 changes: 160 additions & 141 deletions llvm/test/CodeGen/AMDGPU/udivrem.ll

Large diffs are not rendered by default.

7 changes: 2 additions & 5 deletions llvm/test/CodeGen/AMDGPU/uint_to_fp.f64.ll
Original file line number Diff line number Diff line change
Expand Up @@ -76,12 +76,9 @@ define amdgpu_kernel void @s_uint_to_fp_v4i32_to_v4f64(<4 x double> addrspace(1)

; GCN-LABEL: {{^}}uint_to_fp_i1_to_f64:
; VI-DAG: s_cmp_eq_u32
; VI-DAG: s_cselect_b32 s[[SSEL:[0-9]+]], 0x3ff00000, 0
; VI-DAG: v_mov_b32_e32 v[[SEL:[0-9]+]], s[[SSEL]]
; SI-DAG: s_cmp_eq_u32
; SI-DAG: s_cselect_b64 vcc, -1, 0
; SI-DAG: v_cndmask_b32_e32 v[[SEL:[0-9]+]], 0, {{v[0-9]+}}, vcc
; GCN-DAG: s_cselect_b32 s[[SSEL:[0-9]+]], 0x3ff00000, 0
; GCN-DAG: v_mov_b32_e32 v[[ZERO:[0-9]+]], 0{{$}}
; GCN-DAG: v_mov_b32_e32 v[[SEL:[0-9]+]], s[[SSEL]]
; GCN: flat_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, v[[[ZERO]]:[[SEL]]]
; GCN: s_endpgm
define amdgpu_kernel void @uint_to_fp_i1_to_f64(double addrspace(1)* %out, i32 %in) {
Expand Down
331 changes: 161 additions & 170 deletions llvm/test/CodeGen/AMDGPU/urem64.ll

Large diffs are not rendered by default.

12 changes: 6 additions & 6 deletions llvm/test/CodeGen/AMDGPU/vselect.ll
Original file line number Diff line number Diff line change
Expand Up @@ -13,9 +13,9 @@
; VI: s_cselect_b32

; SI-DAG: s_cmp_gt_i32
; SI-DAG: v_cndmask_b32_e64
; SI-DAG: s_cselect_b32
; SI-DAG: s_cmp_gt_i32
; SI-DAG: v_cndmask_b32_e32
; SI-DAG: s_cselect_b32

define amdgpu_kernel void @test_select_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in0, <2 x i32> addrspace(1)* %in1, <2 x i32> %val) {
entry:
Expand Down Expand Up @@ -59,10 +59,10 @@ entry:
; VI: s_cselect_b32
; VI: s_cselect_b32

; SI-DAG: v_cndmask_b32_e64
; SI-DAG: v_cndmask_b32_e64
; SI-DAG: v_cndmask_b32_e64
; SI-DAG: v_cndmask_b32_e32
; SI-DAG: s_cselect_b32
; SI-DAG: s_cselect_b32
; SI-DAG: s_cselect_b32
; SI-DAG: s_cselect_b32

define amdgpu_kernel void @test_select_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in0, <4 x i32> addrspace(1)* %in1, <4 x i32> %val) {
entry:
Expand Down