Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 6 additions & 0 deletions llvm/lib/Target/AArch64/AArch64SMEInstrInfo.td
Original file line number Diff line number Diff line change
Expand Up @@ -1041,3 +1041,9 @@ let Predicates = [HasSME2, HasSVEBFSCALE] in {
defm BFMUL : sme2_bfmul_single<"bfmul">;
defm BFMUL : sme2_bfmul_multi<"bfmul">;
} //[HasSME2, HasSVEBFSCALE]

let Uses = [FPMR, FPCR] in {
let Predicates = [HasSME2p2, HasSMEF8F32] in {
defm FMOP4A : sme2_fmop4a_fp8_fp32_4way<"fmop4a">;
}
}
35 changes: 35 additions & 0 deletions llvm/lib/Target/AArch64/SMEInstrFormats.td
Original file line number Diff line number Diff line change
Expand Up @@ -5382,3 +5382,38 @@ multiclass sme2_fmop4as_fp16_non_widening<bit S, string mnemonic> {
// Multiple vectors
def _M2Z2Z_H : sme2_fp16_quarter_tile_outer_product<1, 1, S, mnemonic, ZZ_h_mul_r_Lo, ZZ_h_mul_r_Hi>;
}

class sme2_fp8_fp32_quarter_tile_outer_product<bit M, bit N, string mnemonic, RegisterOperand zn_ty, RegisterOperand zm_ty>
: I<(outs TileOp32:$ZAda),
(ins TileOp32:$_ZAda, zn_ty:$Zn, zm_ty:$Zm),
mnemonic, "\t$ZAda, $Zn, $Zm",
"", []>, Sched<[]> {
bits<2> ZAda;
bits<3> Zn;
bits<3> Zm;

let Inst{31-21} = 0b10000000001;
let Inst{20} = M;
let Inst{19-17} = Zm;
let Inst{16-10} = 0b0000000;
let Inst{9} = N;
let Inst{8-6} = Zn;
let Inst{5-2} = 0b0000;
let Inst{1-0} = ZAda;

let Constraints = "$ZAda = $_ZAda";
}

multiclass sme2_fmop4a_fp8_fp32_4way<string mnemonic> {
// Single vectors
def _MZZ_BtoS : sme2_fp8_fp32_quarter_tile_outer_product<0, 0, mnemonic, ZPR8Mul2_Lo, ZPR8Mul2_Hi>;

// Multiple and single vectors
def _M2ZZ_BtoS : sme2_fp8_fp32_quarter_tile_outer_product<0, 1, mnemonic, ZZ_b_mul_r_Lo, ZPR8Mul2_Hi>;

// Single and multiple vectors
def _MZ2Z_BtoS : sme2_fp8_fp32_quarter_tile_outer_product<1, 0, mnemonic, ZPR8Mul2_Lo, ZZ_b_mul_r_Hi>;

// Multiple vectors
def _M2Z2Z_BtoS : sme2_fp8_fp32_quarter_tile_outer_product<1, 1, mnemonic, ZZ_b_mul_r_Lo, ZZ_b_mul_r_Hi>;
}
120 changes: 120 additions & 0 deletions llvm/test/MC/AArch64/SME2p2/fmop4a-fp8-fp32-widening-diagnostics.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,120 @@
// RUN: not llvm-mc -triple=aarch64 -mattr=+sme2p2,+sme-f8f32 < %s 2>&1 | FileCheck %s

// Single vectors

fmop4a za0.d, z0.b, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid matrix operand

fmop4a za4.s, z0.b, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, z0.d, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z0.b..z14.b

fmop4a za0.s, z15.b, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z0.b..z14.b

fmop4a za0.s, z16.b, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z0.b..z14.b

fmop4a za0.s, z0.b, z16.s
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

fmop4a za0.s, z12.b, z17.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

fmop4a za0.s, z12.b, z14.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

fmop4a za0.s, z12.b, z31.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

// Single and multiple vectors

fmop4a za0.d, z0.b, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid matrix operand

fmop4a za4.s, z0.b, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, z0.d, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z0.b..z14.b

fmop4a za0.s, z1.b, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z0.b..z14.b

fmop4a za0.s, z16.b, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z0.b..z14.b

fmop4a za0.s, z0.b, {z16.s-z17.s}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, z0.b, {z17.b-z18.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z16-z30, where the first vector is a multiple of 2 and with matching element types

fmop4a za0.s, z0.b, {z16.b-z18.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, z0.b, {z12.b-z13.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z16-z30, where the first vector is a multiple of 2 and with matching element types

// Multiple and single vectors

fmop4a za0.d, {z0.b-z1.b}, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid matrix operand

fmop4a za4.s, {z0.b-z1.b}, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z0.s-z1.b}, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: mismatched register size suffix

fmop4a za0.s, {z1.b-z2.b}, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z0-z14, where the first vector is a multiple of 2 and with matching element types

fmop4a za0.s, {z0.b-z2.b}, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z16.b-z17.b}, z16.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z0-z14, where the first vector is a multiple of 2 and with matching element types

fmop4a za0.s, {z0.b-z1.b}, z16.d
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

fmop4a za0.s, {z0.b-z1.b}, z17.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

fmop4a za0.s, {z0.b-z1.b}, z12.b
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid restricted vector register, expected even register in z16.b..z30.b

// Multiple vectors

fmop4a za0.d, {z0.b-z1.b}, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid matrix operand

fmop4a za4.s, {z0.b-z1.b}, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z0.s-z1.s}, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z1.b-z2.b}, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z0-z14, where the first vector is a multiple of 2 and with matching element types

fmop4a za0.s, {z0.b-z2.b}, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z18.b-z19.b}, {z16.b-z17.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z0-z14, where the first vector is a multiple of 2 and with matching element types

fmop4a za0.s, {z0.b-z1.b}, {z16.s-z17.s}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z0.b-z1.b}, {z19.b-z20.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z16-z30, where the first vector is a multiple of 2 and with matching element types

fmop4a za0.s, {z0.b-z1.b}, {z18.b-z20.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid operand for instruction

fmop4a za0.s, {z0.b-z1.b}, {z10.b-z11.b}
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: Invalid vector list, expected list with 2 consecutive SVE vectors in the range z16-z30, where the first vector is a multiple of 2 and with matching element types
93 changes: 93 additions & 0 deletions llvm/test/MC/AArch64/SME2p2/fmop4a-fp8-fp32-widening.s
Original file line number Diff line number Diff line change
@@ -0,0 +1,93 @@
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sme2p2,+sme-f8f32 < %s \
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
// RUN: not llvm-mc -triple=aarch64 -show-encoding < %s 2>&1 \
// RUN: | FileCheck %s --check-prefix=CHECK-ERROR
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sme2p2,+sme-f8f32 < %s \
// RUN: | llvm-objdump -d --mattr=+sme2p2,+sme-f8f32 - | FileCheck %s --check-prefix=CHECK-INST
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sme2p2,+sme-f8f32 < %s \
// RUN: | llvm-objdump -d --mattr=-sme2p2 - | FileCheck %s --check-prefix=CHECK-UNKNOWN
// Disassemble encoding and check the re-encoding (-show-encoding) matches.
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sme2p2,+sme-f8f32 < %s \
// RUN: | sed '/.text/d' | sed 's/.*encoding: //g' \
// RUN: | llvm-mc -triple=aarch64 -mattr=+sme2p2,+sme-f8f32 -disassemble -show-encoding \
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST

// Single vectors

fmop4a za0.s, z0.b, z16.b // 10000000-00100000-00000000-00000000
// CHECK-INST: fmop4a za0.s, z0.b, z16.b
// CHECK-ENCODING: [0x00,0x00,0x20,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80200000 <unknown>

fmop4a za1.s, z10.b, z20.b // 10000000-00100100-00000001-01000001
// CHECK-INST: fmop4a za1.s, z10.b, z20.b
// CHECK-ENCODING: [0x41,0x01,0x24,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80240141 <unknown>

fmop4a za3.s, z14.b, z30.b // 10000000-00101110-00000001-11000011
// CHECK-INST: fmop4a za3.s, z14.b, z30.b
// CHECK-ENCODING: [0xc3,0x01,0x2e,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 802e01c3 <unknown>

// Single and multiple vectors

fmop4a za0.s, z0.b, {z16.b-z17.b} // 10000000-00110000-00000000-00000000
// CHECK-INST: fmop4a za0.s, z0.b, { z16.b, z17.b }
// CHECK-ENCODING: [0x00,0x00,0x30,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80300000 <unknown>

fmop4a za1.s, z10.b, {z20.b-z21.b} // 10000000-00110100-00000001-01000001
// CHECK-INST: fmop4a za1.s, z10.b, { z20.b, z21.b }
// CHECK-ENCODING: [0x41,0x01,0x34,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80340141 <unknown>

fmop4a za3.s, z14.b, {z30.b-z31.b} // 10000000-00111110-00000001-11000011
// CHECK-INST: fmop4a za3.s, z14.b, { z30.b, z31.b }
// CHECK-ENCODING: [0xc3,0x01,0x3e,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 803e01c3 <unknown>

// Multiple and single vectors

fmop4a za0.s, {z0.b-z1.b}, z16.b // 10000000-00100000-00000010-00000000
// CHECK-INST: fmop4a za0.s, { z0.b, z1.b }, z16.b
// CHECK-ENCODING: [0x00,0x02,0x20,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80200200 <unknown>

fmop4a za1.s, {z10.b-z11.b}, z20.b // 10000000-00100100-00000011-01000001
// CHECK-INST: fmop4a za1.s, { z10.b, z11.b }, z20.b
// CHECK-ENCODING: [0x41,0x03,0x24,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80240341 <unknown>

fmop4a za3.s, {z14.b-z15.b}, z30.b // 10000000-00101110-00000011-11000011
// CHECK-INST: fmop4a za3.s, { z14.b, z15.b }, z30.b
// CHECK-ENCODING: [0xc3,0x03,0x2e,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 802e03c3 <unknown>

// Multiple vectors

fmop4a za0.s, {z0.b-z1.b}, {z16.b-z17.b} // 10000000-00110000-00000010-00000000
// CHECK-INST: fmop4a za0.s, { z0.b, z1.b }, { z16.b, z17.b }
// CHECK-ENCODING: [0x00,0x02,0x30,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80300200 <unknown>

fmop4a za1.s, {z10.b-z11.b}, {z20.b-z21.b} // 10000000-00110100-00000011-01000001
// CHECK-INST: fmop4a za1.s, { z10.b, z11.b }, { z20.b, z21.b }
// CHECK-ENCODING: [0x41,0x03,0x34,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 80340341 <unknown>

fmop4a za3.s, {z14.b-z15.b}, {z30.b-z31.b} // 10000000-00111110-00000011-11000011
// CHECK-INST: fmop4a za3.s, { z14.b, z15.b }, { z30.b, z31.b }
// CHECK-ENCODING: [0xc3,0x03,0x3e,0x80]
// CHECK-ERROR: instruction requires: sme2p2 sme-f8f32
// CHECK-UNKNOWN: 803e03c3 <unknown>
Loading