[llvm] c3773f7 - [X86][APX] Fix the assertion of NF instruction with relocation (#138500)

via llvm-commits llvm-commits at lists.llvm.org
Mon May 5 08:07:00 PDT 2025


Author: Feng Zou
Date: 2025-05-05T23:06:56+08:00
New Revision: c3773f7ca8615bca2b121de9326437ebe497fca5

URL: https://github.com/llvm/llvm-project/commit/c3773f7ca8615bca2b121de9326437ebe497fca5
DIFF: https://github.com/llvm/llvm-project/commit/c3773f7ca8615bca2b121de9326437ebe497fca5.diff

LOG: [X86][APX] Fix the assertion of NF instruction with relocation (#138500)

The assertion should be raised only for the NF instructions with
GOTTPOFF relocation.

Added: 
    llvm/test/CodeGen/X86/apx/check-nf-in-suppress-reloc-pass.ll

Modified: 
    llvm/lib/Target/X86/X86SuppressAPXForReloc.cpp

Removed: 
    


################################################################################
diff  --git a/llvm/lib/Target/X86/X86SuppressAPXForReloc.cpp b/llvm/lib/Target/X86/X86SuppressAPXForReloc.cpp
index fe7a49ab4771d..d40995cb1786d 100644
--- a/llvm/lib/Target/X86/X86SuppressAPXForReloc.cpp
+++ b/llvm/lib/Target/X86/X86SuppressAPXForReloc.cpp
@@ -155,8 +155,14 @@ static bool handleNDDOrNFInstructions(MachineFunction &MF,
       switch (Opcode) {
       case X86::ADD64rm_NF:
       case X86::ADD64mr_NF_ND:
-      case X86::ADD64rm_NF_ND:
-        llvm_unreachable("Unexpected NF instruction!");
+      case X86::ADD64rm_NF_ND: {
+        int MemOpNo = X86II::getMemoryOperandNo(MI.getDesc().TSFlags) +
+                      X86II::getOperandBias(MI.getDesc());
+        const MachineOperand &MO = MI.getOperand(X86::AddrDisp + MemOpNo);
+        if (MO.getTargetFlags() == X86II::MO_GOTTPOFF)
+          llvm_unreachable("Unexpected NF instruction!");
+        break;
+      }
       case X86::ADD64rm_ND: {
         int MemOpNo = X86II::getMemoryOperandNo(MI.getDesc().TSFlags) +
                       X86II::getOperandBias(MI.getDesc());

diff  --git a/llvm/test/CodeGen/X86/apx/check-nf-in-suppress-reloc-pass.ll b/llvm/test/CodeGen/X86/apx/check-nf-in-suppress-reloc-pass.ll
new file mode 100644
index 0000000000000..3a2c954e37077
--- /dev/null
+++ b/llvm/test/CodeGen/X86/apx/check-nf-in-suppress-reloc-pass.ll
@@ -0,0 +1,83 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
+; RUN: llc < %s -mtriple=x86_64 -mattr=+nf -verify-machineinstrs | FileCheck %s
+
+; This is to check no assertion raised in X86 Suppress APX for Relocation pass
+; if there is a NF instruction
+
+define fastcc void @foo(i32 %0, i1 %or.cond) nounwind {
+; CHECK-LABEL: foo:
+; CHECK:       # %bb.0: # %entry
+; CHECK-NEXT:    pushq %rbp
+; CHECK-NEXT:    pushq %r15
+; CHECK-NEXT:    pushq %r14
+; CHECK-NEXT:    pushq %r13
+; CHECK-NEXT:    pushq %r12
+; CHECK-NEXT:    pushq %rbx
+; CHECK-NEXT:    pushq %rax
+; CHECK-NEXT:    movl %esi, %ebx
+; CHECK-NEXT:    movslq %edi, %r15
+; CHECK-NEXT:    leaq (,%r15,4), %rax
+; CHECK-NEXT:    leaq (%rax,%rax,4), %r14
+; CHECK-NEXT:    movl %r15d, %r12d
+; CHECK-NEXT:    xorl %r13d, %r13d
+; CHECK-NEXT:    xorl %ebp, %ebp
+; CHECK-NEXT:    jmp .LBB0_1
+; CHECK-NEXT:    .p2align 4
+; CHECK-NEXT:  .LBB0_3: # %if.end41
+; CHECK-NEXT:    # in Loop: Header=BB0_1 Depth=1
+; CHECK-NEXT:    leaq (%r12,%rbp), %rdi
+; CHECK-NEXT:    # kill: def $edi killed $edi killed $rdi
+; CHECK-NEXT:    xorl %esi, %esi
+; CHECK-NEXT:    movq %r14, %rdx
+; CHECK-NEXT:    callq *%r13
+; CHECK-NEXT:    incq %rbp
+; CHECK-NEXT:    addq $20, %r14
+; CHECK-NEXT:  .LBB0_1: # %for.body30
+; CHECK-NEXT:    # =>This Inner Loop Header: Depth=1
+; CHECK-NEXT:    testb $1, %bl
+; CHECK-NEXT:    je .LBB0_3
+; CHECK-NEXT:  # %bb.2: # %if.then37
+; CHECK-NEXT:    # in Loop: Header=BB0_1 Depth=1
+; CHECK-NEXT:    movq %r15, %rax
+; CHECK-NEXT:    addq %rbp, %rax
+; CHECK-NEXT:    movq 0, %rax
+; CHECK-NEXT:    {nf} addq %r15, %rax
+; CHECK-NEXT:    movb $0, (%rbp,%rax)
+; CHECK-NEXT:    jmp .LBB0_3
+entry:
+  %1 = sext i32 %0 to i64
+  br label %for.body30
+
+for.body30:                                       ; preds = %if.end41, %entry
+  %indvars.iv = phi i64 [ %1, %entry ], [ %indvars.iv.next, %if.end41 ]
+  %.pre88 = trunc i64 %indvars.iv to i32
+  br label %if.end16.i
+
+if.then9.i:                                       ; No predecessors!
+  call fastcc void null(ptr null, i32 %.pre88)
+  br label %if.end16.i
+
+if.end16.i:                                       ; preds = %if.then9.i, %for.body30
+  br i1 %or.cond, label %if.then37, label %if.end41
+
+if.then37:                                        ; preds = %if.end16.i
+  %2 = load ptr, ptr null, align 8
+  %arrayidx.i = getelementptr i8, ptr %2, i64 %indvars.iv
+  store i8 0, ptr %arrayidx.i, align 1
+  %3 = icmp eq i64 %indvars.iv, 0
+  br i1 %3, label %if.end41, label %if.then.i65
+
+if.then.i65:                                      ; preds = %if.then37
+  %arraydecay.i = getelementptr [5 x float], ptr null, i64 %indvars.iv, i64 -5
+  %4 = call <5 x float> @llvm.masked.load.v5f32.p0(ptr %arraydecay.i, i32 1, <5 x i1> zeroinitializer, <5 x float> zeroinitializer)
+  br label %if.end41
+
+if.end41:                                         ; preds = %if.then.i65, %if.then37, %if.end16.i
+  %arraydecay44 = getelementptr [5 x float], ptr null, i64 %indvars.iv, i64 0
+  call fastcc void null(i32 %.pre88, i32 0, ptr %arraydecay44)
+  %indvars.iv.next = add i64 %indvars.iv, 1
+  %cmp29 = icmp slt i64 %indvars.iv, 0
+  br label %for.body30
+}
+
+declare <5 x float> @llvm.masked.load.v5f32.p0(ptr captures(none), i32 immarg, <5 x i1>, <5 x float>)


        


More information about the llvm-commits mailing list