[clang] [llvm] Add support for Armv9.6-A memory systems extensions (PR #112341)
Nashe Mncube via cfe-commits
cfe-commits at lists.llvm.org
Tue Oct 15 02:29:32 PDT 2024
https://github.com/nasherm created https://github.com/llvm/llvm-project/pull/112341
Add support for the following Armv9.6-A memory systems extensions:
FEAT_LSUI - Unprivileged Load Store
FEAT_OCCMO - Outer Cacheable Cache Maintenance Operation
FEAT_PCDPHINT - Producer-Consumer Data Placement Hints
FEAT_SRMASK - Bitwise System Register Write Masks
as documented here:
https://developer.arm.com/documentation/109697/2024_09/Feature-descriptions/The-Armv9-6-architecture-extension
>From 345f58ec293e3b5861965726403b53b5fff47255 Mon Sep 17 00:00:00 2001
From: Nashe Mncube <nashe.mncube at arm.com>
Date: Fri, 4 Oct 2024 10:22:10 +0100
Subject: [PATCH] Add support for Armv9.6-A memory systems extensions
Add support for the following Armv9.6-A memory systems extensions:
FEAT_LSUI - Unprivileged Load Store
FEAT_OCCMO - Outer Cacheable Cache Maintenance Operation
FEAT_PCDPHINT - Producer-Consumer Data Placement Hints
FEAT_SRMASK - Bitwise System Register Write Masks
as documented here:
https://developer.arm.com/documentation/109697/2024_09/Feature-descriptions/The-Armv9-6-architecture-extension
Co-authored-by: Jonathan Thackray <jonathan.thackray at arm.com>
Change-Id: Icbbdd194b8885d8a1b9d513faf0b85e74011201d
---
clang/test/Driver/aarch64-v96a.c | 13 +
.../print-supported-extensions-aarch64.c | 3 +
llvm/lib/Target/AArch64/AArch64Features.td | 12 +-
.../lib/Target/AArch64/AArch64InstrFormats.td | 304 ++++++++++++++
llvm/lib/Target/AArch64/AArch64InstrInfo.td | 101 +++++
.../Target/AArch64/AArch64SystemOperands.td | 67 +++
.../AArch64/AsmParser/AArch64AsmParser.cpp | 61 ++-
.../Disassembler/AArch64Disassembler.cpp | 24 ++
.../MCTargetDesc/AArch64InstPrinter.cpp | 27 ++
.../AArch64/MCTargetDesc/AArch64InstPrinter.h | 2 +
.../Target/AArch64/Utils/AArch64BaseInfo.cpp | 7 +
.../Target/AArch64/Utils/AArch64BaseInfo.h | 20 +
llvm/test/MC/AArch64/armv9.6a-lsui.s | 395 ++++++++++++++++++
llvm/test/MC/AArch64/armv9.6a-occmo.s | 14 +
llvm/test/MC/AArch64/armv9.6a-pcdphint.s | 12 +
llvm/test/MC/AArch64/armv9.6a-rme-gpc3.s | 12 +
llvm/test/MC/AArch64/armv9.6a-srmask.s | 104 +++++
.../MC/Disassembler/AArch64/armv9.6a-lsui.txt | 324 ++++++++++++++
.../Disassembler/AArch64/armv9.6a-occmo.txt | 12 +
.../AArch64/armv9.6a-pcdphint.txt | 9 +
.../AArch64/armv9.6a-rme-gpc3.txt | 11 +
.../Disassembler/AArch64/armv9.6a-srmask.txt | 102 +++++
.../TargetParser/TargetParserTest.cpp | 10 +-
23 files changed, 1641 insertions(+), 5 deletions(-)
create mode 100644 llvm/test/MC/AArch64/armv9.6a-lsui.s
create mode 100644 llvm/test/MC/AArch64/armv9.6a-occmo.s
create mode 100644 llvm/test/MC/AArch64/armv9.6a-pcdphint.s
create mode 100644 llvm/test/MC/AArch64/armv9.6a-rme-gpc3.s
create mode 100644 llvm/test/MC/AArch64/armv9.6a-srmask.s
create mode 100644 llvm/test/MC/Disassembler/AArch64/armv9.6a-lsui.txt
create mode 100644 llvm/test/MC/Disassembler/AArch64/armv9.6a-occmo.txt
create mode 100644 llvm/test/MC/Disassembler/AArch64/armv9.6a-pcdphint.txt
create mode 100644 llvm/test/MC/Disassembler/AArch64/armv9.6a-rme-gpc3.txt
create mode 100644 llvm/test/MC/Disassembler/AArch64/armv9.6a-srmask.txt
diff --git a/clang/test/Driver/aarch64-v96a.c b/clang/test/Driver/aarch64-v96a.c
index 0aaadddb2842f8..fd24585acf24f2 100644
--- a/clang/test/Driver/aarch64-v96a.c
+++ b/clang/test/Driver/aarch64-v96a.c
@@ -17,3 +17,16 @@
// GENERICV96A-BE: "-cc1"{{.*}} "-triple" "aarch64_be{{.*}}" "-target-cpu" "generic" "-target-feature" "+v9.6a"
//
// ===== Features supported on aarch64 =====
+//
+// RUN: %clang -target aarch64 -march=armv9.6a+lsui -### -c %s 2>&1 | FileCheck -check-prefix=V96A-LSUI %s
+// RUN: %clang -target aarch64 -march=armv9.6-a+lsui -### -c %s 2>&1 | FileCheck -check-prefix=V96A-LSUI %s
+// V96A-LSUI: "-cc1"{{.*}} "-triple" "aarch64{{.*}}" "-target-cpu" "generic" "-target-feature" "+v9.6a"{{.*}} "-target-feature" "+lsui"
+//
+// RUN: %clang -target aarch64 -march=armv9.6a+occmo -### -c %s 2>&1 | FileCheck -check-prefix=V96A-OCCMO %s
+// RUN: %clang -target aarch64 -march=armv9.6-a+occmo -### -c %s 2>&1 | FileCheck -check-prefix=V96A-OCCMO %s
+// V96A-OCCMO: "-cc1"{{.*}} "-triple" "aarch64{{.*}}" "-target-cpu" "generic" "-target-feature" "+v9.6a"{{.*}} "-target-feature" "+occmo"
+//
+// RUN: %clang -target aarch64 -march=armv9.6a+pcdphint -### -c %s 2>&1 | FileCheck -check-prefix=V96A-PCDPHINT %s
+// RUN: %clang -target aarch64 -march=armv9.6-a+pcdphint -### -c %s 2>&1 | FileCheck -check-prefix=V96A-PCDPHINT %s
+// V96A-PCDPHINT: "-cc1"{{.*}} "-triple" "aarch64{{.*}}" "-target-cpu" "generic" "-target-feature" "+v9.6a"{{.*}} "-target-feature" "+pcdphint"
+//
diff --git a/clang/test/Driver/print-supported-extensions-aarch64.c b/clang/test/Driver/print-supported-extensions-aarch64.c
index e6247307c7219f..642df4b699ecc3 100644
--- a/clang/test/Driver/print-supported-extensions-aarch64.c
+++ b/clang/test/Driver/print-supported-extensions-aarch64.c
@@ -35,12 +35,15 @@
// CHECK-NEXT: ls64 FEAT_LS64, FEAT_LS64_V, FEAT_LS64_ACCDATA Enable Armv8.7-A LD64B/ST64B Accelerator Extension
// CHECK-NEXT: lse FEAT_LSE Enable Armv8.1-A Large System Extension (LSE) atomic instructions
// CHECK-NEXT: lse128 FEAT_LSE128 Enable Armv9.4-A 128-bit Atomic instructions
+// CHECK-NEXT: lsui FEAT_LSUI Enable Armv9.6-A unprivileged load/store instructions
// CHECK-NEXT: lut FEAT_LUT Enable Lookup Table instructions
// CHECK-NEXT: mops FEAT_MOPS Enable Armv8.8-A memcpy and memset acceleration instructions
// CHECK-NEXT: memtag FEAT_MTE, FEAT_MTE2 Enable Memory Tagging Extension
// CHECK-NEXT: simd FEAT_AdvSIMD Enable Advanced SIMD instructions
+// CHECK-NEXT: occmo FEAT_OCCMO Enable Armv9.6-A Outer cacheable cache maintenance operations
// CHECK-NEXT: pauth FEAT_PAuth Enable Armv8.3-A Pointer Authentication extension
// CHECK-NEXT: pauth-lr FEAT_PAuth_LR Enable Armv9.5-A PAC enhancements
+// CHECK-NEXT: pcdphint FEAT_PCDPHINT Enable Armv9.6-A Producer Consumer Data Placement hints
// CHECK-NEXT: pmuv3 FEAT_PMUv3 Enable Armv8.0-A PMUv3 Performance Monitors extension
// CHECK-NEXT: predres FEAT_SPECRES Enable Armv8.5-A execution and data prediction invalidation instructions
// CHECK-NEXT: rng FEAT_RNG Enable Random Number generation instructions
diff --git a/llvm/lib/Target/AArch64/AArch64Features.td b/llvm/lib/Target/AArch64/AArch64Features.td
index 97671bc59f6b9e..2b391533fd2821 100644
--- a/llvm/lib/Target/AArch64/AArch64Features.td
+++ b/llvm/lib/Target/AArch64/AArch64Features.td
@@ -522,6 +522,14 @@ def FeatureTLBIW : ExtensionWithMArch<"tlbiw", "TLBIW", "FEAT_TLBIW",
// Armv9.6 Architecture Extensions
//===----------------------------------------------------------------------===//
+def FeatureLSUI: ExtensionWithMArch<"lsui", "LSUI", "FEAT_LSUI",
+ "Enable Armv9.6-A unprivileged load/store instructions">;
+
+def FeatureOCCMO: ExtensionWithMArch<"occmo", "OCCMO", "FEAT_OCCMO",
+ "Enable Armv9.6-A Outer cacheable cache maintenance operations">;
+
+def FeaturePCDPHINT: ExtensionWithMArch<"pcdphint", "PCDPHINT", "FEAT_PCDPHINT",
+ "Enable Armv9.6-A Producer Consumer Data Placement hints">;
//===----------------------------------------------------------------------===//
// Other Features
@@ -833,8 +841,8 @@ def HasV9_5aOps : Architecture64<9, 5, "a", "v9.5a",
[HasV9_4aOps, FeatureCPA],
!listconcat(HasV9_4aOps.DefaultExts, [FeatureCPA, FeatureLUT, FeatureFAMINMAX])>;
def HasV9_6aOps : Architecture64<9, 6, "a", "v9.6a",
- [HasV9_5aOps],
- !listconcat(HasV9_5aOps.DefaultExts, [])>;
+ [HasV9_5aOps, FeatureLSUI, FeatureOCCMO],
+ !listconcat(HasV9_5aOps.DefaultExts, [FeatureLSUI, FeatureOCCMO])>;
def HasV8_0rOps : Architecture64<8, 0, "r", "v8r",
[ //v8.1
FeatureCRC, FeaturePAN, FeatureLSE, FeatureCONTEXTIDREL2,
diff --git a/llvm/lib/Target/AArch64/AArch64InstrFormats.td b/llvm/lib/Target/AArch64/AArch64InstrFormats.td
index 1d1d9b5512cfc7..5eb780d8347fc3 100644
--- a/llvm/lib/Target/AArch64/AArch64InstrFormats.td
+++ b/llvm/lib/Target/AArch64/AArch64InstrFormats.td
@@ -1729,6 +1729,11 @@ class TMSystemException<bits<3> op1, string asm, list<dag> pattern>
let Inst{4-0} = 0b00000;
}
+class APASI : SimpleSystemI<0, (ins GPR64:$Xt), "apas", "\t$Xt">, Sched<[]> {
+ let Inst{20-5} = 0b0111001110000000;
+ let DecoderNamespace = "APAS";
+}
+
// Hint instructions that take both a CRm and a 3-bit immediate.
// NOTE: ideally, this would have mayStore = 0, mayLoad = 0, but we cannot
// model patterns with sufficiently fine granularity
@@ -1742,6 +1747,25 @@ let mayStore = 1, mayLoad = 1, hasSideEffects = 1 in
let Inst{11-5} = imm;
}
+def PHintInstOperand : AsmOperandClass {
+ let Name = "PHint";
+ let ParserMethod = "tryParsePHintInstOperand";
+}
+
+def phint_op : Operand<i32> {
+ let ParserMatchClass = PHintInstOperand;
+ let PrintMethod = "printPHintOp";
+}
+
+class STSHHI
+ : SimpleSystemI<0, (ins phint_op:$policy), "stshh", "\t$policy", []>,
+ Sched<[WriteHint]> {
+ bits<3> policy;
+ let Inst{20-12} = 0b000110010;
+ let Inst{11-8} = 0b0110;
+ let Inst{7-5} = policy;
+}
+
// System instructions taking a single literal operand which encodes into
// CRm. op2 differentiates the opcodes.
def BarrierAsmOperand : AsmOperandClass {
@@ -4689,6 +4713,56 @@ multiclass StorePairNoAlloc<bits<2> opc, bit V, DAGOperand regtype,
GPR64sp:$Rn, 0)>;
}
+// Armv9.6-A unprivileged load/store no-allocate pair (FEAT_LSUI)
+
+class BaseLoadStorePairNoAllocLSUI<bits<2> opc, bit V, bit L, dag oops, dag iops,
+ string asm>
+ : I<oops, iops, asm, "\t$Rt, $Rt2, [$Rn, $offset]", "", []> {
+ bits<5> Rt;
+ bits<5> Rt2;
+ bits<5> Rn;
+ bits<7> offset;
+ let Inst{31-30} = opc;
+ let Inst{29-27} = 0b101;
+ let Inst{26} = V;
+ let Inst{25-23} = 0b000;
+ let Inst{22} = L;
+ let Inst{21-15} = offset;
+ let Inst{14-10} = Rt2;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+
+ let DecoderMethod = "DecodePairLdStInstruction";
+}
+
+multiclass LoadPairNoAllocLSUI<bits<2> opc, bit V, DAGOperand regtype,
+ Operand indextype, string asm> {
+ let hasSideEffects = 0, mayStore = 0, mayLoad = 1 in
+ def i : BaseLoadStorePairNoAllocLSUI<opc, V, 1,
+ (outs regtype:$Rt, regtype:$Rt2),
+ (ins GPR64sp:$Rn, indextype:$offset), asm>,
+ Sched<[WriteLD, WriteLDHi]>;
+
+
+ def : InstAlias<asm # "\t$Rt, $Rt2, [$Rn]",
+ (!cast<Instruction>(NAME # "i") regtype:$Rt, regtype:$Rt2,
+ GPR64sp:$Rn, 0)>;
+}
+
+multiclass StorePairNoAllocLSUI<bits<2> opc, bit V, DAGOperand regtype,
+ Operand indextype, string asm> {
+ let hasSideEffects = 0, mayStore = 1, mayLoad = 0 in
+ def i : BaseLoadStorePairNoAllocLSUI<opc, V, 0, (outs),
+ (ins regtype:$Rt, regtype:$Rt2,
+ GPR64sp:$Rn, indextype:$offset),
+ asm>,
+ Sched<[WriteSTP]>;
+
+ def : InstAlias<asm # "\t$Rt, $Rt2, [$Rn]",
+ (!cast<Instruction>(NAME # "i") regtype:$Rt, regtype:$Rt2,
+ GPR64sp:$Rn, 0)>;
+}
+
//---
// Load/store exclusive
//---
@@ -4769,6 +4843,109 @@ class LoadExclusivePair<bits<2> sz, bit o2, bit L, bit o1, bit o0,
let PostEncoderMethod = "fixLoadStoreExclusive<0,1>";
}
+// Armv9.6-a load-store exclusive instructions
+let hasSideEffects = 1, mayLoad = 1, mayStore = 1 in
+class BaseLoadStoreExclusiveLSUI<bits<2> sz, bit L, bit o0,
+ dag oops, dag iops, string asm, string operands>
+ : I<oops, iops, asm, operands, "", []> {
+ let Inst{31-30} = sz;
+ let Inst{29-23} = 0b0010010;
+ let Inst{22} = L;
+ let Inst{15} = o0;
+}
+
+
+// Neither Rs nor Rt2 operands.
+
+class LoadExclusiveLSUI<bits<2> sz, bit L, bit o0,
+ RegisterClass regtype, string asm>
+ : BaseLoadStoreExclusiveLSUI<sz, L, o0, (outs regtype:$Rt),
+ (ins GPR64sp0:$Rn), asm, "\t$Rt, [$Rn]">,
+ Sched<[WriteLD]>
+{
+ bits<5> Rt;
+ bits<5> Rn;
+ let Inst{20-16} = 0b11111;
+ let Unpredictable{20-16} = 0b11111;
+ let Inst{14-10} = 0b11111;
+ let Unpredictable{14-10} = 0b11111;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+
+ let PostEncoderMethod = "fixLoadStoreExclusive<0,0>";
+}
+
+ class StoreExclusiveLSUI<bits<2> sz, bit L, bit o0,
+ RegisterClass regtype, string asm>
+ : BaseLoadStoreExclusiveLSUI<sz, L, o0, (outs GPR32:$Ws),
+ (ins regtype:$Rt, GPR64sp0:$Rn),
+ asm, "\t$Ws, $Rt, [$Rn]">,
+ Sched<[WriteSTX]> {
+ bits<5> Ws;
+ bits<5> Rt;
+ bits<5> Rn;
+ let Inst{20-16} = Ws;
+ let Inst{15} = o0;
+ let Inst{14-10} = 0b11111;
+ let Unpredictable{14-10} = 0b11111;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+
+ let Constraints = "@earlyclobber $Ws";
+ let PostEncoderMethod = "fixLoadStoreExclusive<1,0>";
+ }
+
+// Armv9.6-a load-store unprivileged instructions
+class BaseLoadUnprivilegedLSUI<bits<2> sz, dag oops, dag iops, string asm>
+ : I<oops, iops, asm, "\t$Rt, [$Rn]", "", []> {
+ bits<5> Rt;
+ bits<5> Rn;
+ let Inst{31-30} = sz;
+ let Inst{29-23} = 0b0010010;
+ let Inst{22} = 0b1;
+ let Inst{21} = 0b0;
+ let Inst{20-16} = 0b11111;
+ let Unpredictable{20-16} = 0b11111;
+ let Inst{15} = 0b0;
+ let Inst{14-10} = 0b11111;
+ let Unpredictable{14-10} = 0b11111;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+ let PostEncoderMethod = "fixLoadStoreExclusive<0,0>";
+}
+
+multiclass LoadUnprivilegedLSUI<bits<2> sz, RegisterClass regtype, string asm> {
+ def i : BaseLoadUnprivilegedLSUI<sz, (outs regtype:$Rt),
+ (ins GPR64sp0:$Rn), asm>,
+ Sched<[WriteLD]>;
+
+}
+
+class BaseStoreUnprivilegedLSUI<bits<2> sz, dag oops, dag iops, string asm>
+ : I<oops, iops, asm, "\t$Ws, $Rt, [$Rn]", "", []> {
+ bits<5> Rt;
+ bits<5> Rn;
+ bits<5> Ws;
+ let Inst{31-30} = sz;
+ let Inst{29-23} = 0b0010010;
+ let Inst{22} = 0b0;
+ let Inst{21} = 0b0;
+ let Inst{20-16} = Ws;
+ let Inst{15} = 0b0;
+ let Inst{14-10} = 0b11111;
+ let Unpredictable{14-10} = 0b11111;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+ let PostEncoderMethod = "fixLoadStoreExclusive<1,0>";
+}
+
+multiclass StoreUnprivilegedLSUI<bits<2> sz, RegisterClass regtype, string asm> {
+ def i : BaseStoreUnprivilegedLSUI<sz, (outs GPR32: $Ws),
+ (ins regtype:$Rt, GPR64sp0:$Rn),
+ asm>,
+ Sched<[WriteSTX]>;
+}
+
// Simple store release operations do not check the exclusive monitor.
let mayLoad = 0, mayStore = 1 in
class StoreRelease<bits<2> sz, bit o2, bit L, bit o1, bit o0,
@@ -11845,6 +12022,48 @@ multiclass CompareAndSwapPair<bits<1> Acq, bits<1> Rel, string order> {
def X : BaseCASP<order, "", XSeqPairClassOperand>;
}
+// v9.6-a CAST unprivileged instructions
+let mayLoad = 1, mayStore = 1, hasSideEffects = 1 in
+class BaseCASTEncoding<dag oops, dag iops, string asm,
+ string cstr, list<dag> pattern>
+ : I<oops, iops, asm, "\t$Rs, $Rt, [$Rn]", cstr, pattern> {
+ bits<5> Rs;
+ bits<5> Rn;
+ bits<5> Rt;
+ bit L;
+ bit o0;
+ bits<2> Sz;
+ let Inst{31-30} = Sz;
+ let Inst{29-23} = 0b0010011;
+ let Inst{22} = L;
+ let Inst{21} = 0b0;
+ let Inst{20-16} = Rs;
+ let Inst{15} = o0;
+ let Inst{14-10} = 0b11111;
+ let Unpredictable{14-10} = 0b11111;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+}
+
+multiclass CompareAndSwapUnprivileged<bits<2> Sz, bit L, bit o0, string order> {
+ let Sz = Sz, L = L, o0 = o0 in
+ def X : BaseCASTEncoding <
+ (outs GPR64:$out),
+ (ins GPR64:$Rs, GPR64:$Rt, GPR64sp0:$Rn),
+ "cas" # order # "t",
+ "$out = $Rs",[]>, Sched<[WriteAtomic]>;
+
+}
+
+multiclass CompareAndSwapPairUnprivileged<bits<2> Sz, bit L, bit o0, string order> {
+ let Sz = Sz, L = L, o0 = o0 in
+ def X : BaseCASTEncoding<(outs XSeqPairClassOperand:$out),
+ (ins XSeqPairClassOperand:$Rs, XSeqPairClassOperand:$Rt, GPR64sp0:$Rn),
+ "casp" # order # "t",
+ "$out = $Rs",[]>,
+ Sched<[WriteAtomic]>;
+}
+
let Predicates = [HasLSE] in
class BaseSWP<string order, string size, RegisterClass RC>
: I<(outs RC:$Rt),(ins RC:$Rs, GPR64sp:$Rn), "swp" # order # size,
@@ -11878,6 +12097,35 @@ multiclass Swap<bits<1> Acq, bits<1> Rel, string order> {
let Sz = 0b11, Acq = Acq, Rel = Rel in def X : BaseSWP<order, "", GPR64>;
}
+// v9.6a swap operations
+class BaseSWPLSUI<string order, RegisterClass RC>
+ : I<(outs RC:$Rt),(ins RC:$Rs, GPR64sp:$Rn), "swpt" # order,
+ "\t$Rs, $Rt, [$Rn]","",[]>,
+ Sched<[WriteAtomic]> {
+ bits<2> Sz;
+ bit Acq;
+ bit Rel;
+ bits<5> Rs;
+ bits<5> Rn;
+ bits<5> Rt;
+ let Inst{31-30} = Sz;
+ let Inst{29-24} = 0b011001;
+ let Inst{23} = Acq;
+ let Inst{22} = Rel;
+ let Inst{21} = 0b1;
+ let Inst{20-16} = Rs;
+ let Inst{15} = 0b1;
+ let Inst{14-12} = 0b000;
+ let Inst{11-10} = 0b01;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+}
+
+multiclass SwapLSUI<bits<1> Acq, bits<1> Rel, string order> {
+ let Sz = 0b00, Acq = Acq, Rel = Rel in def W : BaseSWPLSUI<order, GPR32>;
+ let Sz = 0b01, Acq = Acq, Rel = Rel in def X : BaseSWPLSUI<order, GPR64>;
+}
+
let Predicates = [HasLSE], mayLoad = 1, mayStore = 1, hasSideEffects = 1 in
class BaseLDOPregister<string op, string order, string size, RegisterClass RC>
: I<(outs RC:$Rt),(ins RC:$Rs, GPR64sp:$Rn), "ld" # op # order # size,
@@ -11916,6 +12164,39 @@ multiclass LDOPregister<bits<3> opc, string op, bits<1> Acq, bits<1> Rel,
def X : BaseLDOPregister<op, order, "", GPR64>;
}
+class BaseLDOPregisterLSUI<string op, string order, RegisterClass RC>
+ : I<(outs RC:$Rt),(ins RC:$Rs, GPR64sp:$Rn), "ldt" # op # order,
+ "\t$Rs, $Rt, [$Rn]","",[]>,
+ Sched<[WriteAtomic]> {
+ bits<2> Sz;
+ bit Acq;
+ bit Rel;
+ bits<5> Rs;
+ bits<3> opc;
+ bits<5> Rn;
+ bits<5> Rt;
+ let Inst{31-30} = Sz;
+ let Inst{29-24} = 0b011001;
+ let Inst{23} = Acq;
+ let Inst{22} = Rel;
+ let Inst{21} = 0b1;
+ let Inst{20-16} = Rs;
+ let Inst{15} = 0b0;
+ let Inst{14-12} = opc;
+ let Inst{11-10} = 0b01;
+ let Inst{9-5} = Rn;
+ let Inst{4-0} = Rt;
+}
+
+
+multiclass LDOPregisterLSUI<bits<3> opc, string op, bits<1> Acq, bits<1> Rel,
+ string order> {
+ let Sz = 0b00, Acq = Acq, Rel = Rel, opc = opc in
+ def W : BaseLDOPregisterLSUI<op, order, GPR32>;
+ let Sz = 0b01, Acq = Acq, Rel = Rel, opc = opc in
+ def X : BaseLDOPregisterLSUI<op, order, GPR64>;
+}
+
// Differing SrcRHS and DstRHS allow you to cover CLR & SUB by giving a more
// complex DAG for DstRHS.
let Predicates = [HasLSE] in
@@ -12020,6 +12301,29 @@ multiclass STOPregister<string asm, string instr> {
!cast<Instruction>(instr # "X")>;
}
+class BaseSTOPregisterLSUI<string asm, RegisterClass OP, Register Reg,
+ Instruction inst> :
+ InstAlias<asm # "\t$Rs, [$Rn]", (inst Reg, OP:$Rs, GPR64sp:$Rn)>;
+
+multiclass STOPregisterLSUI<string asm, string instr> {
+ def : BaseSTOPregisterLSUI<asm # "a", GPR32, WZR,
+ !cast<Instruction>(instr # "W")>;
+ def : BaseSTOPregisterLSUI<asm # "a", GPR64, XZR,
+ !cast<Instruction>(instr # "X")>;
+ def : BaseSTOPregisterLSUI<asm # "l", GPR32, WZR,
+ !cast<Instruction>(instr # "W")>;
+ def : BaseSTOPregisterLSUI<asm # "l", GPR64, XZR,
+ !cast<Instruction>(instr # "X")>;
+ def : BaseSTOPregisterLSUI<asm # "al", GPR32, WZR,
+ !cast<Instruction>(instr # "W")>;
+ def : BaseSTOPregisterLSUI<asm # "al", GPR64, XZR,
+ !cast<Instruction>(instr # "X")>;
+ def : BaseSTOPregisterLSUI<asm, GPR32, WZR,
+ !cast<Instruction>(instr # "W")>;
+ def : BaseSTOPregisterLSUI<asm, GPR64, XZR,
+ !cast<Instruction>(instr # "X")>;
+}
+
class LoadStore64B_base<bits<3> opc, string asm_inst, string asm_ops,
dag iops, dag oops, list<dag> pat>
: I<oops, iops, asm_inst, asm_ops, "", pat>,
diff --git a/llvm/lib/Target/AArch64/AArch64InstrInfo.td b/llvm/lib/Target/AArch64/AArch64InstrInfo.td
index 325508b62a9f14..99e586d9953ece 100644
--- a/llvm/lib/Target/AArch64/AArch64InstrInfo.td
+++ b/llvm/lib/Target/AArch64/AArch64InstrInfo.td
@@ -213,6 +213,13 @@ def HasSMEF8F16 : Predicate<"Subtarget->isStreaming() && Subtarget->hasSMEF8
def HasSMEF8F32 : Predicate<"Subtarget->isStreaming() && Subtarget->hasSMEF8F32()">,
AssemblerPredicateWithAll<(all_of FeatureSMEF8F32), "sme-f8f32">;
+def HasPCDPHINT : Predicate<"Subtarget->hasPCDPHINT()">,
+ AssemblerPredicateWithAll<(all_of FeaturePCDPHINT), "pcdphint">;
+def HasLSUI : Predicate<"Subtarget->hasLSUI()">,
+ AssemblerPredicateWithAll<(all_of FeatureLSUI), "lsui">;
+def HasOCCMO : Predicate<"Subtarget->hasOCCMO()">,
+ AssemblerPredicateWithAll<(all_of FeatureOCCMO), "occmo">;
+
// A subset of SVE(2) instructions are legal in Streaming SVE execution mode,
// they should be enabled if either has been specified.
def HasSVEorSME
@@ -1231,6 +1238,11 @@ def : InstAlias<"sevl", (HINT 0b101)>;
def : InstAlias<"dgh", (HINT 0b110)>;
def : InstAlias<"esb", (HINT 0b10000)>, Requires<[HasRAS]>;
def : InstAlias<"csdb", (HINT 20)>;
+
+let Predicates = [HasPCDPHINT] in {
+ def STSHH: STSHHI;
+}
+
// In order to be able to write readable assembly, LLVM should accept assembly
// inputs that use Branch Target Indentification mnemonics, even with BTI disabled.
// However, in order to be compatible with other assemblers (e.g. GAS), LLVM
@@ -2568,12 +2580,59 @@ defm CASPA : CompareAndSwapPair<1, 0, "a">;
defm CASPL : CompareAndSwapPair<0, 1, "l">;
defm CASPAL : CompareAndSwapPair<1, 1, "al">;
+// v9.6-a atomic CAST
+let Predicates = [HasLSUI] in {
+defm CAST : CompareAndSwapUnprivileged<0b11, 0, 0, "">;
+defm CASLT : CompareAndSwapUnprivileged<0b11, 0, 1, "l">;
+defm CASAT : CompareAndSwapUnprivileged<0b11, 1, 0, "a">;
+defm CASALT : CompareAndSwapUnprivileged<0b11, 1, 1, "al">;
+
+// v9.6-a atomic CASPT
+defm CASPT : CompareAndSwapPairUnprivileged<0b01, 0, 0, "">;
+defm CASPLT : CompareAndSwapPairUnprivileged<0b01, 0, 1, "l">;
+defm CASPAT : CompareAndSwapPairUnprivileged<0b01, 1, 0, "a">;
+defm CASPALT : CompareAndSwapPairUnprivileged<0b01, 1, 1, "al">;
+}
+
// v8.1 atomic SWP
defm SWP : Swap<0, 0, "">;
defm SWPA : Swap<1, 0, "a">;
defm SWPL : Swap<0, 1, "l">;
defm SWPAL : Swap<1, 1, "al">;
+// v9.6a atomic swap (FEAT_LSUI)
+let Predicates = [HasLSUI] in {
+ defm SWPT : SwapLSUI<0, 0, "">;
+ defm SWPTA : SwapLSUI<1, 0, "a">;
+ defm SWPTL : SwapLSUI<0, 1, "l">;
+ defm SWPTAL : SwapLSUI<1, 1, "al">;
+}
+
+// v9.6-a unprivileged atomic LD<OP> (FEAT_LSUI)
+let Predicates = [HasLSUI] in {
+ defm LDTADD : LDOPregisterLSUI<0b000, "add", 0, 0, "">;
+ defm LDTADDA : LDOPregisterLSUI<0b000, "add", 1, 0, "a">;
+ defm LDTADDL : LDOPregisterLSUI<0b000, "add", 0, 1, "l">;
+ defm LDTADDAL : LDOPregisterLSUI<0b000, "add", 1, 1, "al">;
+
+ defm LDTCLR : LDOPregisterLSUI<0b001, "clr", 0, 0, "">;
+ defm LDTCLRA : LDOPregisterLSUI<0b001, "clr", 1, 0, "a">;
+ defm LDTCLRL : LDOPregisterLSUI<0b001, "clr", 0, 1, "l">;
+ defm LDTCLRAL : LDOPregisterLSUI<0b001, "clr", 1, 1, "al">;
+
+ defm LDTSET : LDOPregisterLSUI<0b011, "set", 0, 0, "">;
+ defm LDTSETA : LDOPregisterLSUI<0b011, "set", 1, 0, "a">;
+ defm LDTSETL : LDOPregisterLSUI<0b011, "set", 0, 1, "l">;
+ defm LDTSETAL : LDOPregisterLSUI<0b011, "set", 1, 1, "al">;
+
+ defm : STOPregisterLSUI<"sttadd","LDTADD">; // STTADDx
+ defm : STOPregisterLSUI<"sttclr","LDTCLR">; // STTCLRx
+ defm : STOPregisterLSUI<"sttset","LDTSET">; // STTSETx
+}
+
+// v9.6-a FEAT_RME_GPC3
+def APAS : APASI;
+
// v8.1 atomic LD<OP>(register). Performs load and then ST<OP>(register)
defm LDADD : LDOPregister<0b000, "add", 0, 0, "">;
defm LDADDA : LDOPregister<0b000, "add", 1, 0, "a">;
@@ -4020,6 +4079,33 @@ defm STNPD : StorePairNoAlloc<0b01, 1, FPR64Op, simm7s8, "stnp">;
defm STNPQ : StorePairNoAlloc<0b10, 1, FPR128Op, simm7s16, "stnp">;
}
+// Armv9.6-A unprivileged load/store pair, including no-allocate forms (FEAT_LSUI)
+let Predicates = [HasLSUI] in {
+ defm LDTP : LoadPairOffset<0b11, 0, GPR64z, simm7s8, "ldtp">;
+ def LDTPpre : LoadPairPreIdx<0b11, 0, GPR64z, simm7s8, "ldtp">;
+ def LDTPpost : LoadPairPostIdx<0b11, 0, GPR64z, simm7s8, "ldtp">;
+
+ defm STTNPX : StorePairNoAllocLSUI<0b11, 0, GPR64z, simm7s8, "sttnp">;
+ defm LDTNPX : LoadPairNoAllocLSUI<0b11, 0, GPR64z, simm7s8, "ldtnp">;
+
+ defm STTP : StorePairOffset<0b11, 0, GPR64z, simm7s8, "sttp">;
+ def STTPpre : StorePairPreIdx<0b11, 0, GPR64z, simm7s8, "sttp">;
+ def STTPpost : StorePairPostIdx<0b11, 0, GPR64z, simm7s8, "sttp">;
+}
+
+let Predicates = [HasLSUI, HasFPARMv8] in {
+ defm LDTPQ : LoadPairOffset<0b11, 1, FPR128Op, simm7s16, "ldtp">;
+ def LDTPQpre : LoadPairPreIdx<0b11, 1, FPR128Op, simm7s16, "ldtp">;
+ def LDTPQpost : LoadPairPostIdx<0b11, 1, FPR128Op, simm7s16, "ldtp">;
+
+ defm STTNPQ : StorePairNoAllocLSUI<0b11, 1, FPR128Op, simm7s16, "sttnp">;
+ defm LDTNPQ : LoadPairNoAllocLSUI<0b11, 1, FPR128Op, simm7s16, "ldtnp">;
+
+ defm STTPQ : StorePairOffset<0b11, 1, FPR128Op, simm7s16, "sttp">;
+ def STTPQpre : StorePairPreIdx<0b11, 1, FPR128Op, simm7s16, "sttp">;
+ def STTPQpost : StorePairPostIdx<0b11, 1, FPR128Op, simm7s16, "sttp">;
+}
+
def : Pat<(AArch64stp GPR64z:$Rt, GPR64z:$Rt2, (am_indexed7s64 GPR64sp:$Rn, simm7s8:$offset)),
(STPXi GPR64z:$Rt, GPR64z:$Rt2, GPR64sp:$Rn, simm7s8:$offset)>;
@@ -4660,6 +4746,21 @@ let Predicates = [HasLOR] in {
def STLLRH0 : InstAlias<"stllrh\t$Rt, [$Rn, #0]", (STLLRH GPR32: $Rt, GPR64sp:$Rn)>;
}
+// v9.6-a Unprivileged load store operations
+let Predicates = [HasLSUI] in {
+defm LDTXRW : LoadUnprivilegedLSUI<0b10, GPR32, "ldtxr">;
+defm LDTXRX : LoadUnprivilegedLSUI<0b11, GPR64, "ldtxr">;
+
+def LDATXRW : LoadExclusiveLSUI <0b10, 1, 1, GPR32, "ldatxr">;
+def LDATXRX : LoadExclusiveLSUI <0b11, 1, 1, GPR64, "ldatxr">;
+
+defm STTXRW : StoreUnprivilegedLSUI<0b10, GPR32, "sttxr">;
+defm STTXRX : StoreUnprivilegedLSUI<0b11, GPR64, "sttxr">;
+
+def STLTXRW : StoreExclusiveLSUI<0b10, 0, 1, GPR32, "stltxr">;
+def STLTXRX : StoreExclusiveLSUI<0b11, 0, 1, GPR64, "stltxr">;
+}
+
//===----------------------------------------------------------------------===//
// Scaled floating point to integer conversion instructions.
//===----------------------------------------------------------------------===//
diff --git a/llvm/lib/Target/AArch64/AArch64SystemOperands.td b/llvm/lib/Target/AArch64/AArch64SystemOperands.td
index dd0ce1cf47a792..804d1dc5bf6fd4 100644
--- a/llvm/lib/Target/AArch64/AArch64SystemOperands.td
+++ b/llvm/lib/Target/AArch64/AArch64SystemOperands.td
@@ -177,6 +177,17 @@ def : DC<"CIPAE", 0b100, 0b0111, 0b1110, 0b000>;
def : DC<"CIGDPAE", 0b100, 0b0111, 0b1110, 0b111>;
}
+let Requires = [{ {AArch64::FeatureOCCMO} }] in {
+// Outer cacheable CMO (FEAT_OCCMO)
+def : DC<"CIVAOC", 0b011, 0b0111, 0b1111, 0b000>;
+def : DC<"CVAOC", 0b011, 0b0111, 0b1011, 0b000>;
+}
+
+let Requires = [{ {AArch64::FeatureOCCMO, AArch64::FeatureMTE} }] in {
+def : DC<"CIGDVAOC", 0b011, 0b0111, 0b1111, 0b111>;
+def : DC<"CGDVAOC", 0b011, 0b0111, 0b1011, 0b111>;
+}
+
//===----------------------------------------------------------------------===//
// IC (instruction cache maintenance) instruction options.
//===----------------------------------------------------------------------===//
@@ -1970,3 +1981,59 @@ def : RWSysReg<"HACDBSCONS_EL2", 0b11, 0b100, 0b0010, 0b0011, 0b101>;
// v9.5a Fine Grained Write Trap EL3 (FEAT_FGWTE3)
// Op0 Op1 CRn CRm Op2
def : RWSysReg<"FGWTE3_EL3", 0b11, 0b110, 0b0001, 0b0001, 0b101>;
+
+//===----------------------------------------------------------------------===//
+// FEAT_SRMASK v9.6a registers
+//===----------------------------------------------------------------------===//
+def : RWSysReg<"SCTLRMASK_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b000>;
+def : RWSysReg<"SCTLRMASK_EL2", 0b11, 0b100, 0b0001, 0b0100, 0b000>;
+def : RWSysReg<"SCTLRMASK_EL12", 0b11, 0b101, 0b0001, 0b0100, 0b000>;
+def : RWSysReg<"CPACRMASK_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b010>;
+def : RWSysReg<"CPTRMASK_EL2", 0b11, 0b100, 0b0001, 0b0100, 0b010>;
+def : RWSysReg<"CPACRMASK_EL12", 0b11, 0b101, 0b0001, 0b0100, 0b010>;
+def : RWSysReg<"SCTLR2MASK_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b011>;
+def : RWSysReg<"SCTLR2MASK_EL2", 0b11, 0b100, 0b0001, 0b0100, 0b011>;
+def : RWSysReg<"SCTLR2MASK_EL12", 0b11, 0b101, 0b0001, 0b0100, 0b011>;
+def : RWSysReg<"CPACRALIAS_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b100>;
+def : RWSysReg<"SCTLRALIAS_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b110>;
+def : RWSysReg<"SCTLR2ALIAS_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b111>;
+def : RWSysReg<"TCRMASK_EL1", 0b11, 0b000, 0b0010, 0b0111, 0b010>;
+def : RWSysReg<"TCRMASK_EL2", 0b11, 0b100, 0b0010, 0b0111, 0b010>;
+def : RWSysReg<"TCRMASK_EL12", 0b11, 0b101, 0b0010, 0b0111, 0b010>;
+def : RWSysReg<"TCR2MASK_EL1", 0b11, 0b000, 0b0010, 0b0111, 0b011>;
+def : RWSysReg<"TCR2MASK_EL2", 0b11, 0b100, 0b0010, 0b0111, 0b011>;
+def : RWSysReg<"TCR2MASK_EL12", 0b11, 0b101, 0b0010, 0b0111, 0b011>;
+def : RWSysReg<"TCRALIAS_EL1", 0b11, 0b000, 0b0010, 0b0111, 0b110>;
+def : RWSysReg<"TCR2ALIAS_EL1", 0b11, 0b000, 0b0010, 0b0111, 0b111>;
+def : RWSysReg<"ACTLRMASK_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b001>;
+def : RWSysReg<"ACTLRMASK_EL2", 0b11, 0b100, 0b0001, 0b0100, 0b001>;
+def : RWSysReg<"ACTLRMASK_EL12", 0b11, 0b101, 0b0001, 0b0100, 0b001>;
+def : RWSysReg<"ACTLRALIAS_EL1", 0b11, 0b000, 0b0001, 0b0100, 0b101>;
+
+//===----------------------------------------------------------------------===//
+// v9.6a PCDPHINT instruction options.
+//===----------------------------------------------------------------------===//
+
+class PHint<bits<2> op0, bits<3> op1, bits<4> crn, bits<4> crm,
+ bits<3> op2, string name> : SearchableTable {
+ let SearchableFields = ["Name", "Encoding"];
+ let EnumValueField = "Encoding";
+
+ string Name = name;
+ string AltName = name;
+ bits<16> Encoding;
+ let Encoding{15-14} = op0;
+ let Encoding{13-11} = op1;
+ let Encoding{10-7} = crn;
+ let Encoding{6-3} = crm;
+ let Encoding{2-0} = op2;
+ code Requires = [{ {} }];
+}
+
+let Requires = [{ {AArch64::FeaturePCDPHINT} }] in {
+ def KEEP : PHint<0b00, 0b000, 0b0000, 0b0000, 0b000, "keep">;
+ def STRM : PHint<0b00, 0b000, 0b0000, 0b0000, 0b001, "strm">;
+}
+
+// v9.6a Realm management extension enhancements
+def : RWSysReg<"GPCBW_EL3", 0b11, 0b110, 0b0010, 0b0001, 0b101>;
diff --git a/llvm/lib/Target/AArch64/AsmParser/AArch64AsmParser.cpp b/llvm/lib/Target/AArch64/AsmParser/AArch64AsmParser.cpp
index df69c20b1359fc..faa7856f95fb1a 100644
--- a/llvm/lib/Target/AArch64/AsmParser/AArch64AsmParser.cpp
+++ b/llvm/lib/Target/AArch64/AsmParser/AArch64AsmParser.cpp
@@ -286,6 +286,7 @@ class AArch64AsmParser : public MCTargetAsmParser {
ParseStatus tryParseSVEVecLenSpecifier(OperandVector &Operands);
ParseStatus tryParseGPR64x8(OperandVector &Operands);
ParseStatus tryParseImmRange(OperandVector &Operands);
+ ParseStatus tryParsePHintInstOperand(OperandVector &Operands);
public:
enum AArch64MatchResultTy {
@@ -361,6 +362,7 @@ class AArch64Operand : public MCParsedAsmOperand {
k_FPImm,
k_Barrier,
k_PSBHint,
+ k_PHint,
k_BTIHint,
} Kind;
@@ -481,7 +483,11 @@ class AArch64Operand : public MCParsedAsmOperand {
unsigned Length;
unsigned Val;
};
-
+ struct PHintOp {
+ const char *Data;
+ unsigned Length;
+ unsigned Val;
+ };
struct BTIHintOp {
const char *Data;
unsigned Length;
@@ -511,6 +517,7 @@ class AArch64Operand : public MCParsedAsmOperand {
struct SysCRImmOp SysCRImm;
struct PrefetchOp Prefetch;
struct PSBHintOp PSBHint;
+ struct PHintOp PHint;
struct BTIHintOp BTIHint;
struct ShiftExtendOp ShiftExtend;
struct SVCROp SVCR;
@@ -576,6 +583,9 @@ class AArch64Operand : public MCParsedAsmOperand {
case k_PSBHint:
PSBHint = o.PSBHint;
break;
+ case k_PHint:
+ PHint = o.PHint;
+ break;
case k_BTIHint:
BTIHint = o.BTIHint;
break;
@@ -728,11 +738,21 @@ class AArch64Operand : public MCParsedAsmOperand {
return PSBHint.Val;
}
+ unsigned getPHint() const {
+ assert(Kind == k_PHint && "Invalid access!");
+ return PHint.Val;
+ }
+
StringRef getPSBHintName() const {
assert(Kind == k_PSBHint && "Invalid access!");
return StringRef(PSBHint.Data, PSBHint.Length);
}
+ StringRef getPHintName() const {
+ assert(Kind == k_PHint && "Invalid access!");
+ return StringRef(PHint.Data, PHint.Length);
+ }
+
unsigned getBTIHint() const {
assert(Kind == k_BTIHint && "Invalid access!");
return BTIHint.Val;
@@ -1484,6 +1504,7 @@ class AArch64Operand : public MCParsedAsmOperand {
bool isSysCR() const { return Kind == k_SysCR; }
bool isPrefetch() const { return Kind == k_Prefetch; }
bool isPSBHint() const { return Kind == k_PSBHint; }
+ bool isPHint() const { return Kind == k_PHint; }
bool isBTIHint() const { return Kind == k_BTIHint; }
bool isShiftExtend() const { return Kind == k_ShiftExtend; }
bool isShifter() const {
@@ -2143,6 +2164,11 @@ class AArch64Operand : public MCParsedAsmOperand {
Inst.addOperand(MCOperand::createImm(getPSBHint()));
}
+ void addPHintOperands(MCInst &Inst, unsigned N) const {
+ assert(N == 1 && "Invalid number of operands!");
+ Inst.addOperand(MCOperand::createImm(getPHint()));
+ }
+
void addBTIHintOperands(MCInst &Inst, unsigned N) const {
assert(N == 1 && "Invalid number of operands!");
Inst.addOperand(MCOperand::createImm(getBTIHint()));
@@ -2440,6 +2466,17 @@ class AArch64Operand : public MCParsedAsmOperand {
return Op;
}
+ static std::unique_ptr<AArch64Operand>
+ CreatePHintInst(unsigned Val, StringRef Str, SMLoc S, MCContext &Ctx) {
+ auto Op = std::make_unique<AArch64Operand>(k_PHint, Ctx);
+ Op->PHint.Val = Val;
+ Op->PHint.Data = Str.data();
+ Op->PHint.Length = Str.size();
+ Op->StartLoc = S;
+ Op->EndLoc = S;
+ return Op;
+ }
+
static std::unique_ptr<AArch64Operand> CreateSysCR(unsigned Val, SMLoc S,
SMLoc E, MCContext &Ctx) {
auto Op = std::make_unique<AArch64Operand>(k_SysCR, Ctx);
@@ -2592,6 +2629,9 @@ void AArch64Operand::print(raw_ostream &OS) const {
case k_PSBHint:
OS << getPSBHintName();
break;
+ case k_PHint:
+ OS << getPHintName();
+ break;
case k_BTIHint:
OS << getBTIHintName();
break;
@@ -3736,6 +3776,8 @@ static const struct Extension {
{"sme-fa64", {AArch64::FeatureSMEFA64}},
{"cpa", {AArch64::FeatureCPA}},
{"tlbiw", {AArch64::FeatureTLBIW}},
+ {"lsui", {AArch64::FeatureLSUI}},
+ {"occmo", {AArch64::FeatureOCCMO}},
};
static void setRequiredFeatureString(FeatureBitset FBS, std::string &Str) {
@@ -4112,6 +4154,23 @@ ParseStatus AArch64AsmParser::tryParseSysReg(OperandVector &Operands) {
return ParseStatus::Success;
}
+ParseStatus
+AArch64AsmParser::tryParsePHintInstOperand(OperandVector &Operands) {
+ SMLoc S = getLoc();
+ const AsmToken &Tok = getTok();
+ if (Tok.isNot(AsmToken::Identifier))
+ return TokError("invalid operand for instruction");
+
+ auto PH = AArch64PHint::lookupPHintByName(Tok.getString());
+ if (!PH)
+ return TokError("invalid operand for instruction");
+
+ Operands.push_back(AArch64Operand::CreatePHintInst(
+ PH->Encoding, Tok.getString(), S, getContext()));
+ Lex(); // Eat identifier token.
+ return ParseStatus::Success;
+}
+
/// tryParseNeonVectorRegister - Parse a vector register operand.
bool AArch64AsmParser::tryParseNeonVectorRegister(OperandVector &Operands) {
if (getTok().isNot(AsmToken::Identifier))
diff --git a/llvm/lib/Target/AArch64/Disassembler/AArch64Disassembler.cpp b/llvm/lib/Target/AArch64/Disassembler/AArch64Disassembler.cpp
index b97f00c9931122..85933754dae4aa 100644
--- a/llvm/lib/Target/AArch64/Disassembler/AArch64Disassembler.cpp
+++ b/llvm/lib/Target/AArch64/Disassembler/AArch64Disassembler.cpp
@@ -1114,6 +1114,14 @@ static DecodeStatus DecodePairLdStInstruction(MCInst &Inst, uint32_t insn,
case AArch64::STPSpre:
case AArch64::STGPpre:
case AArch64::STGPpost:
+ case AArch64::LDTPpre:
+ case AArch64::LDTPpost:
+ case AArch64::LDTPQpost:
+ case AArch64::LDTPQpre:
+ case AArch64::STTPpost:
+ case AArch64::STTPpre:
+ case AArch64::STTPQpost:
+ case AArch64::STTPQpre:
DecodeSimpleRegisterClass<AArch64::GPR64spRegClassID, 0, 32>(Inst, Rn, Addr,
Decoder);
break;
@@ -1130,6 +1138,10 @@ static DecodeStatus DecodePairLdStInstruction(MCInst &Inst, uint32_t insn,
case AArch64::LDPSWpre:
case AArch64::STGPpre:
case AArch64::STGPpost:
+ case AArch64::LDTPpost:
+ case AArch64::LDTPpre:
+ case AArch64::STTPpost:
+ case AArch64::STTPpre:
NeedsDisjointWritebackTransfer = true;
[[fallthrough]];
case AArch64::LDNPXi:
@@ -1138,6 +1150,10 @@ static DecodeStatus DecodePairLdStInstruction(MCInst &Inst, uint32_t insn,
case AArch64::STPXi:
case AArch64::LDPSWi:
case AArch64::STGPi:
+ case AArch64::LDTPi:
+ case AArch64::STTPi:
+ case AArch64::STTNPXi:
+ case AArch64::LDTNPXi:
DecodeSimpleRegisterClass<AArch64::GPR64RegClassID, 0, 32>(Inst, Rt, Addr,
Decoder);
DecodeSimpleRegisterClass<AArch64::GPR64RegClassID, 0, 32>(Inst, Rt2, Addr,
@@ -1166,6 +1182,14 @@ static DecodeStatus DecodePairLdStInstruction(MCInst &Inst, uint32_t insn,
case AArch64::STPQi:
case AArch64::LDPQpre:
case AArch64::STPQpre:
+ case AArch64::LDTPQi:
+ case AArch64::LDTPQpost:
+ case AArch64::LDTPQpre:
+ case AArch64::LDTNPQi:
+ case AArch64::STTPQi:
+ case AArch64::STTPQpost:
+ case AArch64::STTPQpre:
+ case AArch64::STTNPQi:
DecodeSimpleRegisterClass<AArch64::FPR128RegClassID, 0, 32>(Inst, Rt, Addr,
Decoder);
DecodeSimpleRegisterClass<AArch64::FPR128RegClassID, 0, 32>(Inst, Rt2, Addr,
diff --git a/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.cpp b/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.cpp
index 7c9113f6bc2380..762a7af8c3ddb3 100644
--- a/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.cpp
+++ b/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.cpp
@@ -988,6 +988,22 @@ bool AArch64InstPrinter::printSysAlias(const MCInst *MI,
Name = std::string(AT->Name);
}
break;
+ // Overlaps with AT and DC
+ case 15: {
+ const AArch64AT::AT *AT = AArch64AT::lookupATByEncoding(Encoding);
+ const AArch64DC::DC *DC = AArch64DC::lookupDCByEncoding(Encoding);
+ if (AT && AT->haveFeatures(STI.getFeatureBits())) {
+ NeedsReg = true;
+ Ins = "at\t";
+ Name = std::string(AT->Name);
+ } else if (DC && DC->haveFeatures(STI.getFeatureBits())) {
+ NeedsReg = true;
+ Ins = "dc\t";
+ Name = std::string(DC->Name);
+ } else {
+ return false;
+ }
+ } break;
}
} else if (CnVal == 8 || CnVal == 9) {
// TLBI aliases
@@ -2125,3 +2141,14 @@ void AArch64InstPrinter::printSyspXzrPair(const MCInst *MI, unsigned OpNum,
"MC representation of SyspXzrPair should be XZR");
O << getRegisterName(Reg) << ", " << getRegisterName(Reg);
}
+
+void AArch64InstPrinter::printPHintOp(const MCInst *MI, unsigned OpNum,
+ const MCSubtargetInfo &STI,
+ raw_ostream &O) {
+ unsigned Op = MI->getOperand(OpNum).getImm();
+ auto PH = AArch64PHint::lookupPHintByEncoding(Op);
+ if (PH)
+ O << PH->Name;
+ else
+ markup(O, Markup::Immediate) << '#' << formatImm(Op);
+}
diff --git a/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.h b/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.h
index 9dccdf42361b21..e7b62b3203681b 100644
--- a/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.h
+++ b/llvm/lib/Target/AArch64/MCTargetDesc/AArch64InstPrinter.h
@@ -236,6 +236,8 @@ class AArch64InstPrinter : public MCInstPrinter {
template <unsigned ImmIs0, unsigned ImmIs1>
void printExactFPImm(const MCInst *MI, unsigned OpNum,
const MCSubtargetInfo &STI, raw_ostream &O);
+ void printPHintOp(const MCInst *MI, unsigned OpNum,
+ const MCSubtargetInfo &STI, raw_ostream &O);
};
class AArch64AppleInstPrinter : public AArch64InstPrinter {
diff --git a/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.cpp b/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.cpp
index a742c406537bee..59937a7d2a1f68 100644
--- a/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.cpp
+++ b/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.cpp
@@ -132,6 +132,13 @@ namespace llvm {
}
}
+namespace llvm {
+namespace AArch64PHint {
+#define GET_PHINT_IMPL
+#include "AArch64GenSystemOperands.inc"
+} // namespace AArch64PHint
+} // namespace llvm
+
namespace llvm {
namespace AArch64BTIHint {
#define GET_BTI_IMPL
diff --git a/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.h b/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.h
index 9faecccb1bd104..8f34cf054fe286 100644
--- a/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.h
+++ b/llvm/lib/Target/AArch64/Utils/AArch64BaseInfo.h
@@ -582,6 +582,26 @@ namespace AArch64PSBHint {
#include "AArch64GenSystemOperands.inc"
}
+namespace AArch64PHint {
+struct PHint {
+ const char *Name;
+ const char *AltName;
+ unsigned Encoding;
+ FeatureBitset FeaturesRequired;
+
+ bool haveFeatures(FeatureBitset ActiveFeatures) const {
+ return ActiveFeatures[llvm::AArch64::FeatureAll] ||
+ (FeaturesRequired & ActiveFeatures) == FeaturesRequired;
+ }
+};
+
+#define GET_PHINT_DECL
+#include "AArch64GenSystemOperands.inc"
+
+const PHint *lookupPHintByName(StringRef);
+const PHint *lookupPHintByEncoding(uint16_t);
+} // namespace AArch64PHint
+
namespace AArch64BTIHint {
struct BTI : SysAlias {
using SysAlias::SysAlias;
diff --git a/llvm/test/MC/AArch64/armv9.6a-lsui.s b/llvm/test/MC/AArch64/armv9.6a-lsui.s
new file mode 100644
index 00000000000000..d366bdfa695e4b
--- /dev/null
+++ b/llvm/test/MC/AArch64/armv9.6a-lsui.s
@@ -0,0 +1,395 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+// RUN: llvm-mc -triple aarch64 -mattr=+lsui -show-encoding %s | FileCheck %s
+
+_func:
+//------------------------------------------------------------------------------
+// Unprivileged load/store operations
+//------------------------------------------------------------------------------
+ ldtxr x9, [sp]
+ ldtxr x9, [sp, #0]
+ ldtxr x10, [x11]
+ ldtxr x10, [x11, #0]
+
+ ldatxr x9, [sp]
+ ldatxr x10, [x11]
+
+ sttxr wzr, w4, [sp]
+ sttxr wzr, w4, [sp, #0]
+ sttxr w5, x6, [x7]
+ sttxr w5, x6, [x7, #0]
+
+ stltxr w2, w4, [sp]
+ stltxr w5, x6, [x7]
+
+//------------------------------------------------------------------------------
+// Unprivileged load/store register pair (offset)
+//------------------------------------------------------------------------------
+
+ ldtp x21, x29, [x2, #504]
+ ldtp x22, x23, [x3, #-512]
+ ldtp x24, x25, [x4, #8]
+
+ sttp x3, x5, [sp], #16
+ sttp x3, x5, [sp, #8]!
+
+ sttp q3, q5, [sp]
+ sttp q17, q19, [sp, #1008]
+
+//------------------------------------------------------------------------------
+// Load/store register pair (post-indexed)
+//------------------------------------------------------------------------------
+
+ ldtp x21, x29, [x2], #504
+ ldtp x22, x23, [x3], #-512
+ ldtp x24, x25, [x4], #8
+
+ sttp q3, q5, [sp], #0
+ sttp q17, q19, [sp], #1008
+ ldtp q23, q29, [x1], #-1024
+
+//------------------------------------------------------------------------------
+// Load/store register pair (pre-indexed)
+//------------------------------------------------------------------------------
+ ldtp x21, x29, [x2, #504]!
+ ldtp x22, x23, [x3, #-512]!
+ ldtp x24, x25, [x4, #8]!
+
+ sttp q3, q5, [sp, #0]!
+ sttp q17, q19, [sp, #1008]!
+ ldtp q23, q29, [x1, #-1024]!
+
+//------------------------------------------------------------------------------
+// CAS(P)T instructions
+//------------------------------------------------------------------------------
+ //64 bits
+ cast x0, x1, [x2]
+ cast x0, x1, [sp, #0]
+ casat x0, x1, [x2]
+ casat x0, x1, [sp, #0]
+ casalt x0, x1, [x2]
+ casalt x0, x1, [sp, #0]
+ caslt x0, x1, [x2]
+ caslt x0, x1, [sp, #0]
+
+ //CASP instruction
+ caspt x0, x1, x2, x3, [x4]
+ caspt x0, x1, x2, x3, [sp, #0]
+ caspat x0, x1, x2, x3, [x4]
+ caspat x0, x1, x2, x3, [sp, #0]
+ casplt x0, x1, x2, x3, [x4]
+ casplt x0, x1, x2, x3, [sp, #0]
+ caspalt x0, x1, x2, x3, [x4]
+ caspalt x0, x1, x2, x3, [sp, #0]
+
+//------------------------------------------------------------------------------
+// SWPT{A|L|AL} instructions
+//------------------------------------------------------------------------------
+ swpt w7, wzr, [x5]
+ swpt x9, xzr, [sp]
+
+ swpta w7, wzr, [x5]
+ swpta x9, xzr, [sp]
+
+ swptl w7, wzr, [x5]
+ swptl x9, xzr, [sp]
+
+ swptal w7, wzr, [x5]
+ swptal x9, xzr, [sp]
+
+//------------------------------------------------------------------------------
+// LDT{ADD|CLR|SET}{A|L|AL} instructions
+//------------------------------------------------------------------------------
+
+ ldtadd w7, wzr, [x5]
+ ldtadd x9, xzr, [sp]
+
+ ldtadda w7, wzr, [x5]
+ ldtadda x9, xzr, [sp]
+
+ ldtaddl w7, wzr, [x5]
+ ldtaddl x9, xzr, [sp]
+
+ ldtaddal w7, wzr, [x5]
+ ldtaddal x9, xzr, [sp]
+
+ ldtclr w7, wzr, [x5]
+ ldtclr x9, xzr, [sp]
+
+ ldtclrl w7, wzr, [x5]
+ ldtclrl x9, xzr, [sp]
+
+ ldtclra w7, wzr, [x5]
+ ldtclra x9, xzr, [sp]
+
+ ldtclral w7, wzr, [x5]
+ ldtclral x9, xzr, [sp]
+
+ ldtset w7, wzr, [x5]
+ ldtset x9, xzr, [sp]
+
+ ldtsetl w7, wzr, [x5]
+ ldtsetl x9, xzr, [sp]
+
+ ldtseta w7, wzr, [x5]
+ ldtseta x9, xzr, [sp]
+
+ ldtsetal w7, wzr, [x5]
+ ldtsetal x9, xzr, [sp]
+
+//------------------------------------------------------------------------------
+// STT{ADD|CLR|SET}{A|L|AL} instructions
+//------------------------------------------------------------------------------
+
+ sttadd w0, [x2]
+ sttadd w2, [sp]
+ sttadd x0, [x2]
+ sttadd x2, [sp]
+
+ sttaddl w0, [x2]
+ sttaddl w2, [sp]
+ sttaddl x0, [x2]
+ sttaddl x2, [sp]
+
+ sttadda w0, [x2]
+ sttadda w2, [sp]
+ sttadda x0, [x2]
+ sttadda x2, [sp]
+
+ sttaddal w0, [x2]
+ sttaddal w2, [sp]
+ sttaddal x0, [x2]
+ sttaddal x2, [sp]
+
+ sttclr w0, [x2]
+ sttclr w2, [sp]
+ sttclr x0, [x2]
+ sttclr x2, [sp]
+
+ sttclra w0, [x2]
+ sttclra w2, [sp]
+ sttclra x0, [x2]
+ sttclra x2, [sp]
+
+ sttclrl w0, [x2]
+ sttclrl w2, [sp]
+ sttclrl x0, [x2]
+ sttclrl x2, [sp]
+
+ sttclral w0, [x2]
+ sttclral x2, [sp]
+ sttclral x0, [x2]
+ sttclral x2, [sp]
+
+ sttset w0, [x2]
+ sttset w2, [sp]
+ sttset x0, [x2]
+ sttset x2, [sp]
+
+ sttseta w0, [x2]
+ sttseta w2, [sp]
+ sttseta x0, [x2]
+ sttseta x2, [sp]
+
+ sttsetl w0, [x2]
+ sttsetl w2, [sp]
+ sttsetl x0, [x2]
+ sttsetl x2, [sp]
+
+ sttsetal w0, [x2]
+ sttsetal x2, [sp]
+ sttsetal x0, [x2]
+ sttsetal x2, [sp]
+
+//------------------------------------------------------------------------------
+// Load/store non-temporal register pair (offset)
+//------------------------------------------------------------------------------
+ ldtnp x21, x29, [x2, #504]
+ ldtnp x22, x23, [x3, #-512]
+ ldtnp x24, x25, [x4, #8]
+ ldtnp q23, q29, [x1, #-1024]
+
+ sttnp x3, x5, [sp]
+ sttnp x17, x19, [sp, #64]
+ sttnp q3, q5, [sp]
+ sttnp q17, q19, [sp, #1008]
+
+# CHECK: .text
+
+# CHECK: _func:
+# CHECK-NEXT: ldtxr x9, [sp] // encoding: [0xe9,0x7f,0x5f,0xc9]
+# CHECK-NEXT: ldtxr x9, [sp] // encoding: [0xe9,0x7f,0x5f,0xc9]
+# CHECK-NEXT: ldtxr x10, [x11] // encoding: [0x6a,0x7d,0x5f,0xc9]
+# CHECK-NEXT: ldtxr x10, [x11] // encoding: [0x6a,0x7d,0x5f,0xc9]
+
+# CHECK: ldatxr x9, [sp] // encoding: [0xe9,0xff,0x5f,0xc9]
+# CHECK-NEXT: ldatxr x10, [x11] // encoding: [0x6a,0xfd,0x5f,0xc9]
+
+# CHECK: sttxr wzr, w4, [sp] // encoding: [0xe4,0x7f,0x1f,0x89]
+# CHECK-NEXT: sttxr wzr, w4, [sp] // encoding: [0xe4,0x7f,0x1f,0x89]
+# CHECK-NEXT: sttxr w5, x6, [x7] // encoding: [0xe6,0x7c,0x05,0xc9]
+# CHECK-NEXT: sttxr w5, x6, [x7] // encoding: [0xe6,0x7c,0x05,0xc9]
+
+# CHECK: stltxr w2, w4, [sp] // encoding: [0xe4,0xff,0x02,0x89]
+# CHECK-NEXT: stltxr w5, x6, [x7] // encoding: [0xe6,0xfc,0x05,0xc9]
+
+# CHECK: ldtp x21, x29, [x2, #504] // encoding: [0x55,0xf4,0x5f,0xe9]
+# CHECK-NEXT: ldtp x22, x23, [x3, #-512] // encoding: [0x76,0x5c,0x60,0xe9]
+# CHECK-NEXT: ldtp x24, x25, [x4, #8] // encoding: [0x98,0xe4,0x40,0xe9]
+
+# CHECK: sttp x3, x5, [sp], #16 // encoding: [0xe3,0x17,0x81,0xe8]
+# CHECK-NEXT: sttp x3, x5, [sp, #8]! // encoding: [0xe3,0x97,0x80,0xe9]
+
+# CHECK: sttp q3, q5, [sp] // encoding: [0xe3,0x17,0x00,0xed]
+# CHECK-NEXT: sttp q17, q19, [sp, #1008] // encoding: [0xf1,0xcf,0x1f,0xed]
+
+# CHECK: ldtp x21, x29, [x2], #504 // encoding: [0x55,0xf4,0xdf,0xe8]
+# CHECK-NEXT: ldtp x22, x23, [x3], #-512 // encoding: [0x76,0x5c,0xe0,0xe8]
+# CHECK-NEXT: ldtp x24, x25, [x4], #8 // encoding: [0x98,0xe4,0xc0,0xe8]
+
+# CHECK: sttp q3, q5, [sp], #0 // encoding: [0xe3,0x17,0x80,0xec]
+# CHECK-NEXT: sttp q17, q19, [sp], #1008 // encoding: [0xf1,0xcf,0x9f,0xec]
+# CHECK-NEXT: ldtp q23, q29, [x1], #-1024 // encoding: [0x37,0x74,0xe0,0xec]
+
+# CHECK: ldtp x21, x29, [x2, #504]! // encoding: [0x55,0xf4,0xdf,0xe9]
+# CHECK-NEXT: ldtp x22, x23, [x3, #-512]! // encoding: [0x76,0x5c,0xe0,0xe9]
+# CHECK-NEXT: ldtp x24, x25, [x4, #8]! // encoding: [0x98,0xe4,0xc0,0xe9]
+
+# CHECK: sttp q3, q5, [sp, #0]! // encoding: [0xe3,0x17,0x80,0xed]
+# CHECK-NEXT: sttp q17, q19, [sp, #1008]! // encoding: [0xf1,0xcf,0x9f,0xed]
+# CHECK-NEXT: ldtp q23, q29, [x1, #-1024]! // encoding: [0x37,0x74,0xe0,0xed]
+
+# CHECK: cast x0, x1, [x2] // encoding: [0x41,0x7c,0x80,0xc9]
+# CHECK-NEXT: cast x0, x1, [sp] // encoding: [0xe1,0x7f,0x80,0xc9]
+# CHECK-NEXT: casat x0, x1, [x2] // encoding: [0x41,0x7c,0xc0,0xc9]
+# CHECK-NEXT: casat x0, x1, [sp] // encoding: [0xe1,0x7f,0xc0,0xc9]
+# CHECK-NEXT: casalt x0, x1, [x2] // encoding: [0x41,0xfc,0xc0,0xc9]
+# CHECK-NEXT: casalt x0, x1, [sp] // encoding: [0xe1,0xff,0xc0,0xc9]
+# CHECK-NEXT: caslt x0, x1, [x2] // encoding: [0x41,0xfc,0x80,0xc9]
+# CHECK-NEXT: caslt x0, x1, [sp] // encoding: [0xe1,0xff,0x80,0xc9]
+
+# CHECK: caspt x0, x1, x2, x3, [x4] // encoding: [0x82,0x7c,0x80,0x49]
+# CHECK-NEXT: caspt x0, x1, x2, x3, [sp] // encoding: [0xe2,0x7f,0x80,0x49]
+# CHECK-NEXT: caspat x0, x1, x2, x3, [x4] // encoding: [0x82,0x7c,0xc0,0x49]
+# CHECK-NEXT: caspat x0, x1, x2, x3, [sp] // encoding: [0xe2,0x7f,0xc0,0x49]
+# CHECK-NEXT: casplt x0, x1, x2, x3, [x4] // encoding: [0x82,0xfc,0x80,0x49]
+# CHECK-NEXT: casplt x0, x1, x2, x3, [sp] // encoding: [0xe2,0xff,0x80,0x49]
+# CHECK-NEXT: caspalt x0, x1, x2, x3, [x4] // encoding: [0x82,0xfc,0xc0,0x49]
+# CHECK-NEXT: caspalt x0, x1, x2, x3, [sp] // encoding: [0xe2,0xff,0xc0,0x49]
+
+# CHECK: swpt w7, wzr, [x5] // encoding: [0xbf,0x84,0x27,0x19]
+# CHECK-NEXT: swpt x9, xzr, [sp] // encoding: [0xff,0x87,0x29,0x59]
+
+# CHECK: swpta w7, wzr, [x5] // encoding: [0xbf,0x84,0xa7,0x19]
+# CHECK-NEXT: swpta x9, xzr, [sp] // encoding: [0xff,0x87,0xa9,0x59]
+
+# CHECK: swptl w7, wzr, [x5] // encoding: [0xbf,0x84,0x67,0x19]
+# CHECK-NEXT: swptl x9, xzr, [sp] // encoding: [0xff,0x87,0x69,0x59]
+
+# CHECK: swptal w7, wzr, [x5] // encoding: [0xbf,0x84,0xe7,0x19]
+# CHECK-NEXT: swptal x9, xzr, [sp] // encoding: [0xff,0x87,0xe9,0x59]
+
+# CHECK: ldtadd w7, wzr, [x5] // encoding: [0xbf,0x04,0x27,0x19]
+# CHECK-NEXT: ldtadd x9, xzr, [sp] // encoding: [0xff,0x07,0x29,0x59]
+
+# CHECK: ldtadda w7, wzr, [x5] // encoding: [0xbf,0x04,0xa7,0x19]
+# CHECK-NEXT: ldtadda x9, xzr, [sp] // encoding: [0xff,0x07,0xa9,0x59]
+
+# CHECK: ldtaddl w7, wzr, [x5] // encoding: [0xbf,0x04,0x67,0x19]
+# CHECK-NEXT: ldtaddl x9, xzr, [sp] // encoding: [0xff,0x07,0x69,0x59]
+
+# CHECK: ldtaddal w7, wzr, [x5] // encoding: [0xbf,0x04,0xe7,0x19]
+# CHECK-NEXT: ldtaddal x9, xzr, [sp] // encoding: [0xff,0x07,0xe9,0x59]
+
+# CHECK: ldtclr w7, wzr, [x5] // encoding: [0xbf,0x14,0x27,0x19]
+# CHECK-NEXT: ldtclr x9, xzr, [sp] // encoding: [0xff,0x17,0x29,0x59]
+
+# CHECK: ldtclrl w7, wzr, [x5] // encoding: [0xbf,0x14,0x67,0x19]
+# CHECK-NEXT: ldtclrl x9, xzr, [sp] // encoding: [0xff,0x17,0x69,0x59]
+
+# CHECK: ldtclra w7, wzr, [x5] // encoding: [0xbf,0x14,0xa7,0x19]
+# CHECK-NEXT: ldtclra x9, xzr, [sp] // encoding: [0xff,0x17,0xa9,0x59]
+
+# CHECK: ldtclral w7, wzr, [x5] // encoding: [0xbf,0x14,0xe7,0x19]
+# CHECK-NEXT: ldtclral x9, xzr, [sp] // encoding: [0xff,0x17,0xe9,0x59]
+
+# CHECK: ldtset w7, wzr, [x5] // encoding: [0xbf,0x34,0x27,0x19]
+# CHECK-NEXT: ldtset x9, xzr, [sp] // encoding: [0xff,0x37,0x29,0x59]
+
+# CHECK: ldtsetl w7, wzr, [x5] // encoding: [0xbf,0x34,0x67,0x19]
+# CHECK-NEXT: ldtsetl x9, xzr, [sp] // encoding: [0xff,0x37,0x69,0x59]
+
+# CHECK: ldtseta w7, wzr, [x5] // encoding: [0xbf,0x34,0xa7,0x19]
+# CHECK-NEXT: ldtseta x9, xzr, [sp] // encoding: [0xff,0x37,0xa9,0x59]
+
+# CHECK: ldtsetal w7, wzr, [x5] // encoding: [0xbf,0x34,0xe7,0x19]
+# CHECK-NEXT: ldtsetal x9, xzr, [sp] // encoding: [0xff,0x37,0xe9,0x59]
+
+# CHECK: ldtadd w0, wzr, [x2] // encoding: [0x5f,0x04,0x20,0x19]
+# CHECK-NEXT: ldtadd w2, wzr, [sp] // encoding: [0xff,0x07,0x22,0x19]
+# CHECK-NEXT: ldtadd x0, xzr, [x2] // encoding: [0x5f,0x04,0x20,0x59]
+# CHECK-NEXT: ldtadd x2, xzr, [sp] // encoding: [0xff,0x07,0x22,0x59]
+
+# CHECK: ldtadd w0, wzr, [x2] // encoding: [0x5f,0x04,0x20,0x19]
+# CHECK-NEXT: ldtadd w2, wzr, [sp] // encoding: [0xff,0x07,0x22,0x19]
+# CHECK-NEXT: ldtadd x0, xzr, [x2] // encoding: [0x5f,0x04,0x20,0x59]
+# CHECK-NEXT: ldtadd x2, xzr, [sp] // encoding: [0xff,0x07,0x22,0x59]
+
+# CHECK: ldtadd w0, wzr, [x2] // encoding: [0x5f,0x04,0x20,0x19]
+# CHECK-NEXT: ldtadd w2, wzr, [sp] // encoding: [0xff,0x07,0x22,0x19]
+# CHECK-NEXT: ldtadd x0, xzr, [x2] // encoding: [0x5f,0x04,0x20,0x59]
+# CHECK-NEXT: ldtadd x2, xzr, [sp] // encoding: [0xff,0x07,0x22,0x59]
+
+# CHECK: ldtadd w0, wzr, [x2] // encoding: [0x5f,0x04,0x20,0x19]
+# CHECK-NEXT: ldtadd w2, wzr, [sp] // encoding: [0xff,0x07,0x22,0x19]
+# CHECK-NEXT: ldtadd x0, xzr, [x2] // encoding: [0x5f,0x04,0x20,0x59]
+# CHECK-NEXT: ldtadd x2, xzr, [sp] // encoding: [0xff,0x07,0x22,0x59]
+
+# CHECK: ldtclr w0, wzr, [x2] // encoding: [0x5f,0x14,0x20,0x19]
+# CHECK-NEXT: ldtclr w2, wzr, [sp] // encoding: [0xff,0x17,0x22,0x19]
+# CHECK-NEXT: ldtclr x0, xzr, [x2] // encoding: [0x5f,0x14,0x20,0x59]
+# CHECK-NEXT: ldtclr x2, xzr, [sp] // encoding: [0xff,0x17,0x22,0x59]
+
+# CHECK: ldtclr w0, wzr, [x2] // encoding: [0x5f,0x14,0x20,0x19]
+# CHECK-NEXT: ldtclr w2, wzr, [sp] // encoding: [0xff,0x17,0x22,0x19]
+# CHECK-NEXT: ldtclr x0, xzr, [x2] // encoding: [0x5f,0x14,0x20,0x59]
+# CHECK-NEXT: ldtclr x2, xzr, [sp] // encoding: [0xff,0x17,0x22,0x59]
+
+# CHECK: ldtclr w0, wzr, [x2] // encoding: [0x5f,0x14,0x20,0x19]
+# CHECK-NEXT: ldtclr w2, wzr, [sp] // encoding: [0xff,0x17,0x22,0x19]
+# CHECK-NEXT: ldtclr x0, xzr, [x2] // encoding: [0x5f,0x14,0x20,0x59]
+# CHECK-NEXT: ldtclr x2, xzr, [sp] // encoding: [0xff,0x17,0x22,0x59]
+
+# CHECK: ldtclr w0, wzr, [x2] // encoding: [0x5f,0x14,0x20,0x19]
+# CHECK-NEXT: ldtclr x2, xzr, [sp] // encoding: [0xff,0x17,0x22,0x59]
+# CHECK-NEXT: ldtclr x0, xzr, [x2] // encoding: [0x5f,0x14,0x20,0x59]
+# CHECK-NEXT: ldtclr x2, xzr, [sp] // encoding: [0xff,0x17,0x22,0x59]
+
+# CHECK: ldtset w0, wzr, [x2] // encoding: [0x5f,0x34,0x20,0x19]
+# CHECK-NEXT: ldtset w2, wzr, [sp] // encoding: [0xff,0x37,0x22,0x19]
+# CHECK-NEXT: ldtset x0, xzr, [x2] // encoding: [0x5f,0x34,0x20,0x59]
+# CHECK-NEXT: ldtset x2, xzr, [sp] // encoding: [0xff,0x37,0x22,0x59]
+
+# CHECK: ldtset w0, wzr, [x2] // encoding: [0x5f,0x34,0x20,0x19]
+# CHECK-NEXT: ldtset w2, wzr, [sp] // encoding: [0xff,0x37,0x22,0x19]
+# CHECK-NEXT: ldtset x0, xzr, [x2] // encoding: [0x5f,0x34,0x20,0x59]
+# CHECK-NEXT: ldtset x2, xzr, [sp] // encoding: [0xff,0x37,0x22,0x59]
+
+# CHECK: ldtset w0, wzr, [x2] // encoding: [0x5f,0x34,0x20,0x19]
+# CHECK-NEXT: ldtset w2, wzr, [sp] // encoding: [0xff,0x37,0x22,0x19]
+# CHECK-NEXT: ldtset x0, xzr, [x2] // encoding: [0x5f,0x34,0x20,0x59]
+# CHECK-NEXT: ldtset x2, xzr, [sp] // encoding: [0xff,0x37,0x22,0x59]
+
+# CHECK: ldtset w0, wzr, [x2] // encoding: [0x5f,0x34,0x20,0x19]
+# CHECK-NEXT: ldtset x2, xzr, [sp] // encoding: [0xff,0x37,0x22,0x59]
+# CHECK-NEXT: ldtset x0, xzr, [x2] // encoding: [0x5f,0x34,0x20,0x59]
+# CHECK-NEXT: ldtset x2, xzr, [sp] // encoding: [0xff,0x37,0x22,0x59]
+
+# CHECK: ldtnp x21, x29, [x2, #504] // encoding: [0x55,0xf4,0x5f,0xe8]
+# CHECK-NEXT: ldtnp x22, x23, [x3, #-512] // encoding: [0x76,0x5c,0x60,0xe8]
+# CHECK-NEXT: ldtnp x24, x25, [x4, #8] // encoding: [0x98,0xe4,0x40,0xe8]
+# CHECK-NEXT: ldtnp q23, q29, [x1, #-1024] // encoding: [0x37,0x74,0x60,0xec]
+
+# CHECK: sttnp x3, x5, [sp] // encoding: [0xe3,0x17,0x00,0xe8]
+# CHECK-NEXT: sttnp x17, x19, [sp, #64] // encoding: [0xf1,0x4f,0x04,0xe8]
+# CHECK-NEXT: sttnp q3, q5, [sp] // encoding: [0xe3,0x17,0x00,0xec]
+# CHECK-NEXT: sttnp q17, q19, [sp, #1008] // encoding: [0xf1,0xcf,0x1f,0xec]
diff --git a/llvm/test/MC/AArch64/armv9.6a-occmo.s b/llvm/test/MC/AArch64/armv9.6a-occmo.s
new file mode 100644
index 00000000000000..8a8b5346b6eeee
--- /dev/null
+++ b/llvm/test/MC/AArch64/armv9.6a-occmo.s
@@ -0,0 +1,14 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+// RUN: llvm-mc -triple aarch64-none-linux-gnu -show-encoding -mattr=+occmo -mattr=+mte < %s | FileCheck %s
+.func:
+ dc civaoc, x12
+ dc cigdvaoc, x0
+ dc cvaoc, x13
+ dc cgdvaoc, x1
+
+# CHECK: .text
+# CHECK-NEXT: .func:
+# CHECK-NEXT: dc civaoc, x12 // encoding: [0x0c,0x7f,0x0b,0xd5]
+# CHECK-NEXT: dc cigdvaoc, x0 // encoding: [0xe0,0x7f,0x0b,0xd5]
+# CHECK-NEXT: dc cvaoc, x13 // encoding: [0x0d,0x7b,0x0b,0xd5]
+# CHECK-NEXT: dc cgdvaoc, x1 // encoding: [0xe1,0x7b,0x0b,0xd5]
diff --git a/llvm/test/MC/AArch64/armv9.6a-pcdphint.s b/llvm/test/MC/AArch64/armv9.6a-pcdphint.s
new file mode 100644
index 00000000000000..698e0b2947de82
--- /dev/null
+++ b/llvm/test/MC/AArch64/armv9.6a-pcdphint.s
@@ -0,0 +1,12 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+// RUN: llvm-mc -triple aarch64 -show-encoding -mattr=+pcdphint %s | FileCheck %s
+
+.func:
+ stshh keep
+ stshh strm
+
+# CHECK: .text
+
+# CHECK: .func:
+# CHECK-NEXT: stshh keep // encoding: [0x1f,0x26,0x03,0xd5]
+# CHECK-NEXT: stshh strm // encoding: [0x3f,0x26,0x03,0xd5]
diff --git a/llvm/test/MC/AArch64/armv9.6a-rme-gpc3.s b/llvm/test/MC/AArch64/armv9.6a-rme-gpc3.s
new file mode 100644
index 00000000000000..c6387ea2ef2abd
--- /dev/null
+++ b/llvm/test/MC/AArch64/armv9.6a-rme-gpc3.s
@@ -0,0 +1,12 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+// RUN: llvm-mc -triple aarch64 -show-encoding %s | FileCheck %s
+.func:
+ apas x0
+ mrs x3, GPCBW_EL3
+ msr GPCBW_EL3, x4
+
+# CHECK: .text
+# CHECK-NEXT: .func:
+# CHECK-NEXT: apas x0 // encoding: [0x1f,0x70,0x0e,0xd5]
+# CHECK-NEXT: mrs x3, GPCBW_EL3 // encoding: [0xa3,0x21,0x3e,0xd5]
+# CHECK-NEXT: msr GPCBW_EL3, x4 // encoding: [0xa4,0x21,0x1e,0xd5]
diff --git a/llvm/test/MC/AArch64/armv9.6a-srmask.s b/llvm/test/MC/AArch64/armv9.6a-srmask.s
new file mode 100644
index 00000000000000..d8a68d1fb671b5
--- /dev/null
+++ b/llvm/test/MC/AArch64/armv9.6a-srmask.s
@@ -0,0 +1,104 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+// RUN: llvm-mc -triple aarch64 -show-encoding < %s 2> %t | FileCheck %s
+
+mrs x3, SCTLRMASK_EL1
+mrs x3, SCTLRMASK_EL2
+mrs x3, SCTLRMASK_EL12
+mrs x3, CPACRMASK_EL1
+mrs x3, CPTRMASK_EL2
+mrs x3, CPACRMASK_EL12
+mrs x3, SCTLR2MASK_EL1
+mrs x3, SCTLR2MASK_EL2
+mrs x3, SCTLR2MASK_EL12
+mrs x3, CPACRALIAS_EL1
+mrs x3, SCTLRALIAS_EL1
+mrs x3, SCTLR2ALIAS_EL1
+mrs x3, TCRMASK_EL1
+mrs x3, TCRMASK_EL2
+mrs x3, TCRMASK_EL12
+mrs x3, TCR2MASK_EL1
+mrs x3, TCR2MASK_EL2
+mrs x3, TCR2MASK_EL12
+mrs x3, TCRALIAS_EL1
+mrs x3, TCR2ALIAS_EL1
+mrs x3, ACTLRMASK_EL1
+mrs x3, ACTLRMASK_EL2
+mrs x3, ACTLRMASK_EL12
+mrs x3, ACTLRALIAS_EL1
+
+msr SCTLRMASK_EL1, x3
+msr SCTLRMASK_EL2, x3
+msr SCTLRMASK_EL12, x3
+msr CPACRMASK_EL1, x3
+msr CPTRMASK_EL2, x3
+msr CPACRMASK_EL12, x3
+msr SCTLR2MASK_EL1, x3
+msr SCTLR2MASK_EL2, x3
+msr SCTLR2MASK_EL12, x3
+msr CPACRALIAS_EL1, x3
+msr SCTLRALIAS_EL1, x3
+msr SCTLR2ALIAS_EL1, x3
+msr TCRMASK_EL1, x3
+msr TCRMASK_EL2, x3
+msr TCRMASK_EL12, x3
+msr TCR2MASK_EL1, x3
+msr TCR2MASK_EL2, x3
+msr TCR2MASK_EL12, x3
+msr TCRALIAS_EL1, x3
+msr TCR2ALIAS_EL1, x3
+msr ACTLRMASK_EL1, x3
+msr ACTLRMASK_EL2, x3
+msr ACTLRMASK_EL12, x3
+msr ACTLRALIAS_EL1, x3
+
+# CHECK: .text
+
+# CHECK: mrs x3, SCTLRMASK_EL1 // encoding: [0x03,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, SCTLRMASK_EL2 // encoding: [0x03,0x14,0x3c,0xd5]
+# CHECK-NEXT: mrs x3, SCTLRMASK_EL12 // encoding: [0x03,0x14,0x3d,0xd5]
+# CHECK-NEXT: mrs x3, CPACRMASK_EL1 // encoding: [0x43,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, CPTRMASK_EL2 // encoding: [0x43,0x14,0x3c,0xd5]
+# CHECK-NEXT: mrs x3, CPACRMASK_EL12 // encoding: [0x43,0x14,0x3d,0xd5]
+# CHECK-NEXT: mrs x3, SCTLR2MASK_EL1 // encoding: [0x63,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, SCTLR2MASK_EL2 // encoding: [0x63,0x14,0x3c,0xd5]
+# CHECK-NEXT: mrs x3, SCTLR2MASK_EL12 // encoding: [0x63,0x14,0x3d,0xd5]
+# CHECK-NEXT: mrs x3, CPACRALIAS_EL1 // encoding: [0x83,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, SCTLRALIAS_EL1 // encoding: [0xc3,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, SCTLR2ALIAS_EL1 // encoding: [0xe3,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, TCRMASK_EL1 // encoding: [0x43,0x27,0x38,0xd5]
+# CHECK-NEXT: mrs x3, TCRMASK_EL2 // encoding: [0x43,0x27,0x3c,0xd5]
+# CHECK-NEXT: mrs x3, TCRMASK_EL12 // encoding: [0x43,0x27,0x3d,0xd5]
+# CHECK-NEXT: mrs x3, TCR2MASK_EL1 // encoding: [0x63,0x27,0x38,0xd5]
+# CHECK-NEXT: mrs x3, TCR2MASK_EL2 // encoding: [0x63,0x27,0x3c,0xd5]
+# CHECK-NEXT: mrs x3, TCR2MASK_EL12 // encoding: [0x63,0x27,0x3d,0xd5]
+# CHECK-NEXT: mrs x3, TCRALIAS_EL1 // encoding: [0xc3,0x27,0x38,0xd5]
+# CHECK-NEXT: mrs x3, TCR2ALIAS_EL1 // encoding: [0xe3,0x27,0x38,0xd5]
+# CHECK-NEXT: mrs x3, ACTLRMASK_EL1 // encoding: [0x23,0x14,0x38,0xd5]
+# CHECK-NEXT: mrs x3, ACTLRMASK_EL2 // encoding: [0x23,0x14,0x3c,0xd5]
+# CHECK-NEXT: mrs x3, ACTLRMASK_EL12 // encoding: [0x23,0x14,0x3d,0xd5]
+# CHECK-NEXT: mrs x3, ACTLRALIAS_EL1 // encoding: [0xa3,0x14,0x38,0xd5]
+
+# CHECK: msr SCTLRMASK_EL1, x3 // encoding: [0x03,0x14,0x18,0xd5]
+# CHECK-NEXT: msr SCTLRMASK_EL2, x3 // encoding: [0x03,0x14,0x1c,0xd5]
+# CHECK-NEXT: msr SCTLRMASK_EL12, x3 // encoding: [0x03,0x14,0x1d,0xd5]
+# CHECK-NEXT: msr CPACRMASK_EL1, x3 // encoding: [0x43,0x14,0x18,0xd5]
+# CHECK-NEXT: msr CPTRMASK_EL2, x3 // encoding: [0x43,0x14,0x1c,0xd5]
+# CHECK-NEXT: msr CPACRMASK_EL12, x3 // encoding: [0x43,0x14,0x1d,0xd5]
+# CHECK-NEXT: msr SCTLR2MASK_EL1, x3 // encoding: [0x63,0x14,0x18,0xd5]
+# CHECK-NEXT: msr SCTLR2MASK_EL2, x3 // encoding: [0x63,0x14,0x1c,0xd5]
+# CHECK-NEXT: msr SCTLR2MASK_EL12, x3 // encoding: [0x63,0x14,0x1d,0xd5]
+# CHECK-NEXT: msr CPACRALIAS_EL1, x3 // encoding: [0x83,0x14,0x18,0xd5]
+# CHECK-NEXT: msr SCTLRALIAS_EL1, x3 // encoding: [0xc3,0x14,0x18,0xd5]
+# CHECK-NEXT: msr SCTLR2ALIAS_EL1, x3 // encoding: [0xe3,0x14,0x18,0xd5]
+# CHECK-NEXT: msr TCRMASK_EL1, x3 // encoding: [0x43,0x27,0x18,0xd5]
+# CHECK-NEXT: msr TCRMASK_EL2, x3 // encoding: [0x43,0x27,0x1c,0xd5]
+# CHECK-NEXT: msr TCRMASK_EL12, x3 // encoding: [0x43,0x27,0x1d,0xd5]
+# CHECK-NEXT: msr TCR2MASK_EL1, x3 // encoding: [0x63,0x27,0x18,0xd5]
+# CHECK-NEXT: msr TCR2MASK_EL2, x3 // encoding: [0x63,0x27,0x1c,0xd5]
+# CHECK-NEXT: msr TCR2MASK_EL12, x3 // encoding: [0x63,0x27,0x1d,0xd5]
+# CHECK-NEXT: msr TCRALIAS_EL1, x3 // encoding: [0xc3,0x27,0x18,0xd5]
+# CHECK-NEXT: msr TCR2ALIAS_EL1, x3 // encoding: [0xe3,0x27,0x18,0xd5]
+# CHECK-NEXT: msr ACTLRMASK_EL1, x3 // encoding: [0x23,0x14,0x18,0xd5]
+# CHECK-NEXT: msr ACTLRMASK_EL2, x3 // encoding: [0x23,0x14,0x1c,0xd5]
+# CHECK-NEXT: msr ACTLRMASK_EL12, x3 // encoding: [0x23,0x14,0x1d,0xd5]
+# CHECK-NEXT: msr ACTLRALIAS_EL1, x3 // encoding: [0xa3,0x14,0x18,0xd5]
diff --git a/llvm/test/MC/Disassembler/AArch64/armv9.6a-lsui.txt b/llvm/test/MC/Disassembler/AArch64/armv9.6a-lsui.txt
new file mode 100644
index 00000000000000..7073ade6a309b6
--- /dev/null
+++ b/llvm/test/MC/Disassembler/AArch64/armv9.6a-lsui.txt
@@ -0,0 +1,324 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+# RUN: llvm-mc -triple aarch64 -mattr=+lsui -disassemble %s | FileCheck %s
+
+# LDTXR and STTXR
+[0xe9,0x7f,0x5f,0xc9]
+[0xe9,0x7f,0x5f,0xc9]
+[0x6a,0x7d,0x5f,0xc9]
+[0x6a,0x7d,0x5f,0xc9]
+
+[0xe4,0x7f,0x1f,0x89]
+[0xe4,0x7f,0x1f,0x89]
+[0xe6,0x7c,0x05,0xc9]
+[0xe6,0x7c,0x05,0xc9]
+
+# LDATXR and STLTXR
+[0xe9,0xff,0x5f,0xc9]
+[0x6a,0xfd,0x5f,0xc9]
+
+[0xe4,0xff,0x02,0x89]
+[0xe6,0xfc,0x05,0xc9]
+
+# STTP and LDTP
+[0x55,0xf4,0x5f,0xe9]
+[0x76,0x5c,0x60,0xe9]
+[0x98,0xe4,0x40,0xe9]
+
+[0xe3,0x17,0x81,0xe8]
+[0xe3,0x97,0x80,0xe9]
+[0xe3,0x17,0x00,0xed]
+[0xf1,0xcf,0x1f,0xed]
+
+[0x55,0xf4,0xdf,0xe8]
+[0x76,0x5c,0xe0,0xe8]
+[0x98,0xe4,0xc0,0xe8]
+
+[0xe3,0x17,0x80,0xec]
+[0xf1,0xcf,0x9f,0xec]
+[0x37,0x74,0xe0,0xec]
+
+[0x55,0xf4,0xdf,0xe9]
+[0x76,0x5c,0xe0,0xe9]
+[0x98,0xe4,0xc0,0xe9]
+
+[0xe3,0x17,0x80,0xed]
+[0xf1,0xcf,0x9f,0xed]
+[0x37,0x74,0xe0,0xed]
+
+[0x55,0xf4,0x5f,0xe8]
+[0x76,0x5c,0x60,0xe8]
+[0x98,0xe4,0x40,0xe8]
+[0x37,0x74,0x60,0xec]
+
+[0xe3,0x17,0x00,0xe8]
+[0xf1,0x4f,0x04,0xe8]
+[0xe3,0x17,0x00,0xec]
+[0xf1,0xcf,0x1f,0xec]
+
+# SWPT{A|L}
+[0xbf,0x84,0x27,0x19]
+[0xff,0x87,0x29,0x59]
+
+[0xbf,0x84,0xa7,0x19]
+[0xff,0x87,0xa9,0x59]
+
+[0xbf,0x84,0x67,0x19]
+[0xff,0x87,0x69,0x59]
+
+[0xbf,0x84,0xe7,0x19]
+[0xff,0x87,0xe9,0x59]
+
+# CAS{A|L}T
+[0x41,0x7c,0x80,0xc9]
+[0xe1,0x7f,0x80,0xc9]
+[0x41,0x7c,0xc0,0xc9]
+[0xe1,0x7f,0xc0,0xc9]
+[0x41,0xfc,0xc0,0xc9]
+[0xe1,0xff,0xc0,0xc9]
+[0x41,0xfc,0x80,0xc9]
+[0xe1,0xff,0x80,0xc9]
+
+# CASP{A|L}T
+[0x82,0x7c,0x80,0x49]
+[0xe2,0x7f,0x80,0x49]
+[0x82,0x7c,0xc0,0x49]
+[0xe2,0x7f,0xc0,0x49]
+[0x82,0xfc,0x80,0x49]
+[0xe2,0xff,0x80,0x49]
+[0x82,0xfc,0xc0,0x49]
+[0xe2,0xff,0xc0,0x49]
+
+# LDT{SET|ADD|CLR}{A|L} and STT{ADD|SET|CLR}{L}
+
+[0xbf,0x04,0x27,0x19]
+[0xff,0x07,0x29,0x59]
+
+[0xbf,0x04,0xa7,0x19]
+[0xff,0x07,0xa9,0x59]
+
+[0xbf,0x04,0x67,0x19]
+[0xff,0x07,0x69,0x59]
+
+[0xbf,0x04,0xe7,0x19]
+[0xff,0x07,0xe9,0x59]
+
+[0xbf,0x14,0x27,0x19]
+[0xff,0x17,0x29,0x59]
+
+[0xbf,0x14,0x67,0x19]
+[0xff,0x17,0x69,0x59]
+
+[0xbf,0x14,0xa7,0x19]
+[0xff,0x17,0xa9,0x59]
+
+[0xbf,0x14,0xe7,0x19]
+[0xff,0x17,0xe9,0x59]
+
+[0xbf,0x34,0x27,0x19]
+[0xff,0x37,0x29,0x59]
+
+[0xbf,0x34,0x67,0x19]
+[0xff,0x37,0x69,0x59]
+
+[0xbf,0x34,0xa7,0x19]
+[0xff,0x37,0xa9,0x59]
+
+[0xbf,0x34,0xe7,0x19]
+[0xff,0x37,0xe9,0x59]
+
+[0x5f,0x04,0x20,0x19]
+[0xff,0x07,0x22,0x19]
+[0x5f,0x04,0x20,0x59]
+[0xff,0x07,0x22,0x59]
+
+[0x5f,0x04,0x20,0x19]
+[0xff,0x07,0x22,0x19]
+[0x5f,0x04,0x20,0x59]
+[0xff,0x07,0x22,0x59]
+
+[0x5f,0x04,0x20,0x19]
+[0xff,0x07,0x22,0x19]
+[0x5f,0x04,0x20,0x59]
+[0xff,0x07,0x22,0x59]
+
+[0x5f,0x04,0x20,0x19]
+[0xff,0x07,0x22,0x19]
+[0x5f,0x04,0x20,0x59]
+[0xff,0x07,0x22,0x59]
+
+[0x5f,0x14,0x20,0x19]
+[0xff,0x17,0x22,0x19]
+[0x5f,0x14,0x20,0x59]
+[0xff,0x17,0x22,0x59]
+
+[0x5f,0x14,0x20,0x19]
+[0xff,0x17,0x22,0x19]
+[0x5f,0x14,0x20,0x59]
+[0xff,0x17,0x22,0x59]
+
+[0x5f,0x14,0x20,0x19]
+[0xff,0x17,0x22,0x19]
+[0x5f,0x14,0x20,0x59]
+[0xff,0x17,0x22,0x59]
+
+[0x5f,0x14,0x20,0x19]
+[0xff,0x17,0x22,0x59]
+[0x5f,0x14,0x20,0x59]
+[0xff,0x17,0x22,0x59]
+
+[0x5f,0x34,0x20,0x19]
+[0xff,0x37,0x22,0x19]
+[0x5f,0x34,0x20,0x59]
+[0xff,0x37,0x22,0x59]
+
+[0x5f,0x34,0x20,0x19]
+[0xff,0x37,0x22,0x19]
+[0x5f,0x34,0x20,0x59]
+[0xff,0x37,0x22,0x59]
+
+[0x5f,0x34,0x20,0x19]
+[0xff,0x37,0x22,0x19]
+[0x5f,0x34,0x20,0x59]
+[0xff,0x37,0x22,0x59]
+
+[0x5f,0x34,0x20,0x19]
+[0xff,0x37,0x22,0x59]
+[0x5f,0x34,0x20,0x59]
+[0xff,0x37,0x22,0x59]
+
+# CHECK: .text
+# CHECK-NEXT: ldtxr x9, [sp]
+# CHECK-NEXT: ldtxr x9, [sp]
+# CHECK-NEXT: ldtxr x10, [x11]
+# CHECK-NEXT: ldtxr x10, [x11]
+# CHECK-NEXT: sttxr wzr, w4, [sp]
+# CHECK-NEXT: sttxr wzr, w4, [sp]
+# CHECK-NEXT: sttxr w5, x6, [x7]
+# CHECK-NEXT: sttxr w5, x6, [x7]
+# CHECK-NEXT: ldatxr x9, [sp]
+# CHECK-NEXT: ldatxr x10, [x11]
+# CHECK-NEXT: stltxr w2, w4, [sp]
+# CHECK-NEXT: stltxr w5, x6, [x7]
+# CHECK-NEXT: ldtp x21, x29, [x2, #504]
+# CHECK-NEXT: ldtp x22, x23, [x3, #-512]
+# CHECK-NEXT: ldtp x24, x25, [x4, #8]
+# CHECK-NEXT: sttp x3, x5, [sp], #16
+# CHECK-NEXT: sttp x3, x5, [sp, #8]!
+# CHECK-NEXT: sttp q3, q5, [sp]
+# CHECK-NEXT: sttp q17, q19, [sp, #1008]
+# CHECK-NEXT: ldtp x21, x29, [x2], #504
+# CHECK-NEXT: ldtp x22, x23, [x3], #-512
+# CHECK-NEXT: ldtp x24, x25, [x4], #8
+# CHECK-NEXT: sttp q3, q5, [sp], #0
+# CHECK-NEXT: sttp q17, q19, [sp], #1008
+# CHECK-NEXT: ldtp q23, q29, [x1], #-1024
+# CHECK-NEXT: ldtp x21, x29, [x2, #504]!
+# CHECK-NEXT: ldtp x22, x23, [x3, #-512]!
+# CHECK-NEXT: ldtp x24, x25, [x4, #8]!
+# CHECK-NEXT: sttp q3, q5, [sp, #0]!
+# CHECK-NEXT: sttp q17, q19, [sp, #1008]!
+# CHECK-NEXT: ldtp q23, q29, [x1, #-1024]!
+# CHECK-NEXT: ldtnp x21, x29, [x2, #504]
+# CHECK-NEXT: ldtnp x22, x23, [x3, #-512]
+# CHECK-NEXT: ldtnp x24, x25, [x4, #8]
+# CHECK-NEXT: ldtnp q23, q29, [x1, #-1024]
+# CHECK-NEXT: sttnp x3, x5, [sp]
+# CHECK-NEXT: sttnp x17, x19, [sp, #64]
+# CHECK-NEXT: sttnp q3, q5, [sp]
+# CHECK-NEXT: sttnp q17, q19, [sp, #1008]
+# CHECK-NEXT: swpt w7, wzr, [x5]
+# CHECK-NEXT: swpt x9, xzr, [sp]
+# CHECK-NEXT: swpta w7, wzr, [x5]
+# CHECK-NEXT: swpta x9, xzr, [sp]
+# CHECK-NEXT: swptl w7, wzr, [x5]
+# CHECK-NEXT: swptl x9, xzr, [sp]
+# CHECK-NEXT: swptal w7, wzr, [x5]
+# CHECK-NEXT: swptal x9, xzr, [sp]
+# CHECK-NEXT: cast x0, x1, [x2]
+# CHECK-NEXT: cast x0, x1, [sp]
+# CHECK-NEXT: casat x0, x1, [x2]
+# CHECK-NEXT: casat x0, x1, [sp]
+# CHECK-NEXT: casalt x0, x1, [x2]
+# CHECK-NEXT: casalt x0, x1, [sp]
+# CHECK-NEXT: caslt x0, x1, [x2]
+# CHECK-NEXT: caslt x0, x1, [sp]
+# CHECK-NEXT: caspt x0, x1, x2, x3, [x4]
+# CHECK-NEXT: caspt x0, x1, x2, x3, [sp]
+# CHECK-NEXT: caspat x0, x1, x2, x3, [x4]
+# CHECK-NEXT: caspat x0, x1, x2, x3, [sp]
+# CHECK-NEXT: casplt x0, x1, x2, x3, [x4]
+# CHECK-NEXT: casplt x0, x1, x2, x3, [sp]
+# CHECK-NEXT: caspalt x0, x1, x2, x3, [x4]
+# CHECK-NEXT: caspalt x0, x1, x2, x3, [sp]
+# CHECK-NEXT: ldtadd w7, wzr, [x5]
+# CHECK-NEXT: ldtadd x9, xzr, [sp]
+# CHECK-NEXT: ldtadda w7, wzr, [x5]
+# CHECK-NEXT: ldtadda x9, xzr, [sp]
+# CHECK-NEXT: ldtaddl w7, wzr, [x5]
+# CHECK-NEXT: ldtaddl x9, xzr, [sp]
+# CHECK-NEXT: ldtaddal w7, wzr, [x5]
+# CHECK-NEXT: ldtaddal x9, xzr, [sp]
+# CHECK-NEXT: ldtclr w7, wzr, [x5]
+# CHECK-NEXT: ldtclr x9, xzr, [sp]
+# CHECK-NEXT: ldtclrl w7, wzr, [x5]
+# CHECK-NEXT: ldtclrl x9, xzr, [sp]
+# CHECK-NEXT: ldtclra w7, wzr, [x5]
+# CHECK-NEXT: ldtclra x9, xzr, [sp]
+# CHECK-NEXT: ldtclral w7, wzr, [x5]
+# CHECK-NEXT: ldtclral x9, xzr, [sp]
+# CHECK-NEXT: ldtset w7, wzr, [x5]
+# CHECK-NEXT: ldtset x9, xzr, [sp]
+# CHECK-NEXT: ldtsetl w7, wzr, [x5]
+# CHECK-NEXT: ldtsetl x9, xzr, [sp]
+# CHECK-NEXT: ldtseta w7, wzr, [x5]
+# CHECK-NEXT: ldtseta x9, xzr, [sp]
+# CHECK-NEXT: ldtsetal w7, wzr, [x5]
+# CHECK-NEXT: ldtsetal x9, xzr, [sp]
+# CHECK-NEXT: ldtadd w0, wzr, [x2]
+# CHECK-NEXT: ldtadd w2, wzr, [sp]
+# CHECK-NEXT: ldtadd x0, xzr, [x2]
+# CHECK-NEXT: ldtadd x2, xzr, [sp]
+# CHECK-NEXT: ldtadd w0, wzr, [x2]
+# CHECK-NEXT: ldtadd w2, wzr, [sp]
+# CHECK-NEXT: ldtadd x0, xzr, [x2]
+# CHECK-NEXT: ldtadd x2, xzr, [sp]
+# CHECK-NEXT: ldtadd w0, wzr, [x2]
+# CHECK-NEXT: ldtadd w2, wzr, [sp]
+# CHECK-NEXT: ldtadd x0, xzr, [x2]
+# CHECK-NEXT: ldtadd x2, xzr, [sp]
+# CHECK-NEXT: ldtadd w0, wzr, [x2]
+# CHECK-NEXT: ldtadd w2, wzr, [sp]
+# CHECK-NEXT: ldtadd x0, xzr, [x2]
+# CHECK-NEXT: ldtadd x2, xzr, [sp]
+# CHECK-NEXT: ldtclr w0, wzr, [x2]
+# CHECK-NEXT: ldtclr w2, wzr, [sp]
+# CHECK-NEXT: ldtclr x0, xzr, [x2]
+# CHECK-NEXT: ldtclr x2, xzr, [sp]
+# CHECK-NEXT: ldtclr w0, wzr, [x2]
+# CHECK-NEXT: ldtclr w2, wzr, [sp]
+# CHECK-NEXT: ldtclr x0, xzr, [x2]
+# CHECK-NEXT: ldtclr x2, xzr, [sp]
+# CHECK-NEXT: ldtclr w0, wzr, [x2]
+# CHECK-NEXT: ldtclr w2, wzr, [sp]
+# CHECK-NEXT: ldtclr x0, xzr, [x2]
+# CHECK-NEXT: ldtclr x2, xzr, [sp]
+# CHECK-NEXT: ldtclr w0, wzr, [x2]
+# CHECK-NEXT: ldtclr x2, xzr, [sp]
+# CHECK-NEXT: ldtclr x0, xzr, [x2]
+# CHECK-NEXT: ldtclr x2, xzr, [sp]
+# CHECK-NEXT: ldtset w0, wzr, [x2]
+# CHECK-NEXT: ldtset w2, wzr, [sp]
+# CHECK-NEXT: ldtset x0, xzr, [x2]
+# CHECK-NEXT: ldtset x2, xzr, [sp]
+# CHECK-NEXT: ldtset w0, wzr, [x2]
+# CHECK-NEXT: ldtset w2, wzr, [sp]
+# CHECK-NEXT: ldtset x0, xzr, [x2]
+# CHECK-NEXT: ldtset x2, xzr, [sp]
+# CHECK-NEXT: ldtset w0, wzr, [x2]
+# CHECK-NEXT: ldtset w2, wzr, [sp]
+# CHECK-NEXT: ldtset x0, xzr, [x2]
+# CHECK-NEXT: ldtset x2, xzr, [sp]
+# CHECK-NEXT: ldtset w0, wzr, [x2]
+# CHECK-NEXT: ldtset x2, xzr, [sp]
+# CHECK-NEXT: ldtset x0, xzr, [x2]
+# CHECK-NEXT: ldtset x2, xzr, [sp]
diff --git a/llvm/test/MC/Disassembler/AArch64/armv9.6a-occmo.txt b/llvm/test/MC/Disassembler/AArch64/armv9.6a-occmo.txt
new file mode 100644
index 00000000000000..ccc65e747bc0b4
--- /dev/null
+++ b/llvm/test/MC/Disassembler/AArch64/armv9.6a-occmo.txt
@@ -0,0 +1,12 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+# RUN: llvm-mc -triple aarch64-none-linux-gnu -mattr=+occmo -mattr=+mte -disassemble < %s | FileCheck %s
+[0x0c,0x7f,0x0b,0xd5]
+[0xe0,0x7f,0x0b,0xd5]
+[0x0d,0x7b,0x0b,0xd5]
+[0xe1,0x7b,0x0b,0xd5]
+
+# CHECK: .text
+# CHECK-NEXT: dc civaoc, x12
+# CHECK-NEXT: dc cigdvaoc, x0
+# CHECK-NEXT: dc cvaoc, x13
+# CHECK-NEXT: dc cgdvaoc, x1
diff --git a/llvm/test/MC/Disassembler/AArch64/armv9.6a-pcdphint.txt b/llvm/test/MC/Disassembler/AArch64/armv9.6a-pcdphint.txt
new file mode 100644
index 00000000000000..1e21455b1edf49
--- /dev/null
+++ b/llvm/test/MC/Disassembler/AArch64/armv9.6a-pcdphint.txt
@@ -0,0 +1,9 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+# RUN: llvm-mc -triple aarch64 -disassemble -mattr=+pcdphint %s | FileCheck %s
+
+[0x1f,0x26,0x03,0xd5]
+[0x3f,0x26,0x03,0xd5]
+
+# CHECK: .text
+# CHECK-NEXT: stshh keep
+# CHECK-NEXT: stshh strm
diff --git a/llvm/test/MC/Disassembler/AArch64/armv9.6a-rme-gpc3.txt b/llvm/test/MC/Disassembler/AArch64/armv9.6a-rme-gpc3.txt
new file mode 100644
index 00000000000000..a641731b2f1b2a
--- /dev/null
+++ b/llvm/test/MC/Disassembler/AArch64/armv9.6a-rme-gpc3.txt
@@ -0,0 +1,11 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+# RUN: llvm-mc -triple aarch64 -disassemble %s | FileCheck %s
+
+[0x1f,0x70,0x0e,0xd5]
+[0xa3,0x21,0x3e,0xd5]
+[0xa4,0x21,0x1e,0xd5]
+
+# CHECK: .text
+# CHECK-NEXT: sys #6, c7, c0, #0
+# CHECK-NEXT: mrs x3, GPCBW_EL3
+# CHECK-NEXT: msr GPCBW_EL3, x4
diff --git a/llvm/test/MC/Disassembler/AArch64/armv9.6a-srmask.txt b/llvm/test/MC/Disassembler/AArch64/armv9.6a-srmask.txt
new file mode 100644
index 00000000000000..1401af18aad5d3
--- /dev/null
+++ b/llvm/test/MC/Disassembler/AArch64/armv9.6a-srmask.txt
@@ -0,0 +1,102 @@
+# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
+# RUN: llvm-mc -triple aarch64 -disassemble < %s 2> %t | FileCheck %s
+
+[0x03,0x14,0x38,0xd5]
+[0x03,0x14,0x3c,0xd5]
+[0x03,0x14,0x3d,0xd5]
+[0x43,0x14,0x38,0xd5]
+[0x43,0x14,0x3c,0xd5]
+[0x43,0x14,0x3d,0xd5]
+[0x63,0x14,0x38,0xd5]
+[0x63,0x14,0x3c,0xd5]
+[0x63,0x14,0x3d,0xd5]
+[0x83,0x14,0x38,0xd5]
+[0xc3,0x14,0x38,0xd5]
+[0xe3,0x14,0x38,0xd5]
+[0x43,0x27,0x38,0xd5]
+[0x43,0x27,0x3c,0xd5]
+[0x43,0x27,0x3d,0xd5]
+[0x63,0x27,0x38,0xd5]
+[0x63,0x27,0x3c,0xd5]
+[0x63,0x27,0x3d,0xd5]
+[0xc3,0x27,0x38,0xd5]
+[0xe3,0x27,0x38,0xd5]
+[0x23,0x14,0x38,0xd5]
+[0x23,0x14,0x3c,0xd5]
+[0x23,0x14,0x3d,0xd5]
+[0xa3,0x14,0x38,0xd5]
+
+[0x03,0x14,0x18,0xd5]
+[0x03,0x14,0x1c,0xd5]
+[0x03,0x14,0x1d,0xd5]
+[0x43,0x14,0x18,0xd5]
+[0x43,0x14,0x1c,0xd5]
+[0x43,0x14,0x1d,0xd5]
+[0x63,0x14,0x18,0xd5]
+[0x63,0x14,0x1c,0xd5]
+[0x63,0x14,0x1d,0xd5]
+[0x83,0x14,0x18,0xd5]
+[0xc3,0x14,0x18,0xd5]
+[0xe3,0x14,0x18,0xd5]
+[0x43,0x27,0x18,0xd5]
+[0x43,0x27,0x1c,0xd5]
+[0x43,0x27,0x1d,0xd5]
+[0x63,0x27,0x18,0xd5]
+[0x63,0x27,0x1c,0xd5]
+[0x63,0x27,0x1d,0xd5]
+[0xc3,0x27,0x18,0xd5]
+[0xe3,0x27,0x18,0xd5]
+[0x23,0x14,0x18,0xd5]
+[0x23,0x14,0x1c,0xd5]
+[0x23,0x14,0x1d,0xd5]
+[0xa3,0x14,0x18,0xd5]
+
+# CHECK: .text
+# CHECK-NEXT: mrs x3, SCTLRMASK_EL1
+# CHECK-NEXT: mrs x3, SCTLRMASK_EL2
+# CHECK-NEXT: mrs x3, SCTLRMASK_EL12
+# CHECK-NEXT: mrs x3, CPACRMASK_EL1
+# CHECK-NEXT: mrs x3, CPTRMASK_EL2
+# CHECK-NEXT: mrs x3, CPACRMASK_EL12
+# CHECK-NEXT: mrs x3, SCTLR2MASK_EL1
+# CHECK-NEXT: mrs x3, SCTLR2MASK_EL2
+# CHECK-NEXT: mrs x3, SCTLR2MASK_EL12
+# CHECK-NEXT: mrs x3, CPACRALIAS_EL1
+# CHECK-NEXT: mrs x3, SCTLRALIAS_EL1
+# CHECK-NEXT: mrs x3, SCTLR2ALIAS_EL1
+# CHECK-NEXT: mrs x3, TCRMASK_EL1
+# CHECK-NEXT: mrs x3, TCRMASK_EL2
+# CHECK-NEXT: mrs x3, TCRMASK_EL12
+# CHECK-NEXT: mrs x3, TCR2MASK_EL1
+# CHECK-NEXT: mrs x3, TCR2MASK_EL2
+# CHECK-NEXT: mrs x3, TCR2MASK_EL12
+# CHECK-NEXT: mrs x3, TCRALIAS_EL1
+# CHECK-NEXT: mrs x3, TCR2ALIAS_EL1
+# CHECK-NEXT: mrs x3, ACTLRMASK_EL1
+# CHECK-NEXT: mrs x3, ACTLRMASK_EL2
+# CHECK-NEXT: mrs x3, ACTLRMASK_EL12
+# CHECK-NEXT: mrs x3, ACTLRALIAS_EL1
+# CHECK-NEXT: msr SCTLRMASK_EL1, x3
+# CHECK-NEXT: msr SCTLRMASK_EL2, x3
+# CHECK-NEXT: msr SCTLRMASK_EL12, x3
+# CHECK-NEXT: msr CPACRMASK_EL1, x3
+# CHECK-NEXT: msr CPTRMASK_EL2, x3
+# CHECK-NEXT: msr CPACRMASK_EL12, x3
+# CHECK-NEXT: msr SCTLR2MASK_EL1, x3
+# CHECK-NEXT: msr SCTLR2MASK_EL2, x3
+# CHECK-NEXT: msr SCTLR2MASK_EL12, x3
+# CHECK-NEXT: msr CPACRALIAS_EL1, x3
+# CHECK-NEXT: msr SCTLRALIAS_EL1, x3
+# CHECK-NEXT: msr SCTLR2ALIAS_EL1, x3
+# CHECK-NEXT: msr TCRMASK_EL1, x3
+# CHECK-NEXT: msr TCRMASK_EL2, x3
+# CHECK-NEXT: msr TCRMASK_EL12, x3
+# CHECK-NEXT: msr TCR2MASK_EL1, x3
+# CHECK-NEXT: msr TCR2MASK_EL2, x3
+# CHECK-NEXT: msr TCR2MASK_EL12, x3
+# CHECK-NEXT: msr TCRALIAS_EL1, x3
+# CHECK-NEXT: msr TCR2ALIAS_EL1, x3
+# CHECK-NEXT: msr ACTLRMASK_EL1, x3
+# CHECK-NEXT: msr ACTLRMASK_EL2, x3
+# CHECK-NEXT: msr ACTLRMASK_EL12, x3
+# CHECK-NEXT: msr ACTLRALIAS_EL1, x3
diff --git a/llvm/unittests/TargetParser/TargetParserTest.cpp b/llvm/unittests/TargetParser/TargetParserTest.cpp
index 5b5d45f6c574bf..28081ae5ec8c15 100644
--- a/llvm/unittests/TargetParser/TargetParserTest.cpp
+++ b/llvm/unittests/TargetParser/TargetParserTest.cpp
@@ -1323,8 +1323,8 @@ TEST(TargetParserTest, AArch64ExtensionFeatures) {
AArch64::AEK_CPA, AArch64::AEK_PAUTHLR,
AArch64::AEK_TLBIW, AArch64::AEK_JSCVT,
AArch64::AEK_FCMA, AArch64::AEK_FP8,
- AArch64::AEK_SVEB16B16,
- };
+ AArch64::AEK_SVEB16B16, AArch64::AEK_LSUI,
+ AArch64::AEK_OCCMO, AArch64::AEK_PCDPHINT};
std::vector<StringRef> Features;
@@ -1413,6 +1413,9 @@ TEST(TargetParserTest, AArch64ExtensionFeatures) {
EXPECT_TRUE(llvm::is_contained(Features, "+tlbiw"));
EXPECT_TRUE(llvm::is_contained(Features, "+jsconv"));
EXPECT_TRUE(llvm::is_contained(Features, "+complxnum"));
+ EXPECT_TRUE(llvm::is_contained(Features, "+lsui"));
+ EXPECT_TRUE(llvm::is_contained(Features, "+occmo"));
+ EXPECT_TRUE(llvm::is_contained(Features, "+pcdphint"));
// Assuming we listed every extension above, this should produce the same
// result.
@@ -1554,6 +1557,9 @@ TEST(TargetParserTest, AArch64ArchExtFeature) {
{"sme-lutv2", "nosme-lutv2", "+sme-lutv2", "-sme-lutv2"},
{"sme-f8f16", "nosme-f8f16", "+sme-f8f16", "-sme-f8f16"},
{"sme-f8f32", "nosme-f8f32", "+sme-f8f32", "-sme-f8f32"},
+ {"lsui", "nolsui", "+lsui", "-lsui"},
+ {"occmo", "nooccmo", "+occmo", "-occmo"},
+ {"pcdphint", "nopcdphint", "+pcdphint", "-pcdphint"},
};
for (unsigned i = 0; i < std::size(ArchExt); i++) {
More information about the cfe-commits
mailing list