|
1 | 1 | ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
|
2 |
| -; RUN: opt < %s -interleaved-access -S | FileCheck %s |
3 | 2 | ; RUN: opt < %s -passes=interleaved-access -S | FileCheck %s
|
4 | 3 |
|
5 | 4 | target triple = "aarch64-linux-gnu"
|
@@ -186,6 +185,22 @@ define void @interleave_nxptr_factor2(ptr %ptr, <vscale x 2 x ptr> %l, <vscale x
|
186 | 185 | ret void
|
187 | 186 | }
|
188 | 187 |
|
; Factor-2 interleave of two <vscale x 16 x i8> values stored via
; @llvm.masked.store, where the <vscale x 32 x i1> mask is a splat of the
; scalar i1 %mask (insertelement + zeroinitializer shufflevector).
; The CHECK lines below mirror the input IR instruction-for-instruction, i.e.
; the expected output of the pass is this sequence left unchanged.
| 188 | +define void @interleave_nxi8_factor2_masked_store_splatmask(ptr %ptr, <vscale x 16 x i8> %l, <vscale x 16 x i8> %r, i1 %mask) #0 { |
| 189 | +; CHECK-LABEL: define void @interleave_nxi8_factor2_masked_store_splatmask |
| 190 | +; CHECK-SAME: (ptr [[PTR:%.*]], <vscale x 16 x i8> [[L:%.*]], <vscale x 16 x i8> [[R:%.*]], i1 [[MASK:%.*]]) #[[ATTR0]] { |
| 191 | +; CHECK-NEXT: [[INTERLEAVE:%.*]] = tail call <vscale x 32 x i8> @llvm.vector.interleave2.nxv32i8(<vscale x 16 x i8> [[L]], <vscale x 16 x i8> [[R]]) |
| 192 | +; CHECK-NEXT: [[MASK_INS:%.*]] = insertelement <vscale x 32 x i1> poison, i1 [[MASK]], i64 0 |
| 193 | +; CHECK-NEXT: [[MASK_SPLAT:%.*]] = shufflevector <vscale x 32 x i1> [[MASK_INS]], <vscale x 32 x i1> poison, <vscale x 32 x i32> zeroinitializer |
| 194 | +; CHECK-NEXT: tail call void @llvm.masked.store.nxv32i8.p0(<vscale x 32 x i8> [[INTERLEAVE]], ptr [[PTR]], i32 1, <vscale x 32 x i1> [[MASK_SPLAT]]) |
| 195 | +; CHECK-NEXT: ret void |
| 196 | +; |
| 197 | + %interleave = tail call <vscale x 32 x i8> @llvm.vector.interleave2.nxv32i8(<vscale x 16 x i8> %l, <vscale x 16 x i8> %r)
| 198 | + %mask.ins = insertelement <vscale x 32 x i1> poison, i1 %mask, i64 0
| 199 | + %mask.splat = shufflevector <vscale x 32 x i1> %mask.ins, <vscale x 32 x i1> poison, <vscale x 32 x i32> zeroinitializer
| 200 | + tail call void @llvm.masked.store.nxv32i8.p0(<vscale x 32 x i8> %interleave, ptr %ptr, i32 1, <vscale x 32 x i1> %mask.splat)
| 201 | + ret void
| 202 | +}
| 203 | + |
189 | 204 | ;;; Check that we 'legalize' operations that are wider than the target supports.
|
190 | 205 |
|
191 | 206 | define void @deinterleave_wide_nxi32_factor2(ptr %ptr) #0 {
|
|
0 commit comments