[AMDGPU] Apply alignment attr for make.buffer.rsrc #166914
Conversation
@llvm/pr-subscribers-clang @llvm/pr-subscribers-backend-amdgpu

Author: None (Shoreshen)

Changes

Calculating alignment for the `make.buffer.rsrc` intrinsic. The logic is that the alignment on uses of the return value of `make.buffer.rsrc` should be capped by the alignment of the base operand of `make.buffer.rsrc`.

For example:

```ll
define float @foo(ptr addrspace(1) align X %ptr) {
  %fat.ptr = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p1(ptr addrspace(1) %ptr, i16 0, i32 C, i32 0)
  %y = load float, ptr addrspace(7) %fat.ptr, align Y
  ret float %y
}
```

The hope is that `Y = min(X, Y)`.

Full diff: https://github.com/llvm/llvm-project/pull/166914.diff

4 Files Affected:
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUAttributor.cpp b/llvm/lib/Target/AMDGPU/AMDGPUAttributor.cpp
index 56ab040706a13..70f2fbae08ada 100644
--- a/llvm/lib/Target/AMDGPU/AMDGPUAttributor.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUAttributor.cpp
@@ -1603,7 +1603,7 @@ static bool runImpl(Module &M, AnalysisGetter &AG, TargetMachine &TM,
&AAAMDGPUMinAGPRAlloc::ID, &AACallEdges::ID, &AAPointerInfo::ID,
&AAPotentialConstantValues::ID, &AAUnderlyingObjects::ID,
&AANoAliasAddrSpace::ID, &AAAddressSpace::ID, &AAIndirectCallInfo::ID,
- &AAAMDGPUClusterDims::ID});
+ &AAAMDGPUClusterDims::ID, &AAAlign::ID});
AttributorConfig AC(CGUpdater);
AC.IsClosedWorldModule = Options.IsClosedWorld;
@@ -1657,6 +1657,9 @@ static bool runImpl(Module &M, AnalysisGetter &AG, TargetMachine &TM,
Ptr = RMW->getPointerOperand();
else if (auto *CmpX = dyn_cast<AtomicCmpXchgInst>(&I))
Ptr = CmpX->getPointerOperand();
+ else if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(&I))
+ if (II->getIntrinsicID() == Intrinsic::amdgcn_make_buffer_rsrc)
+ A.getOrCreateAAFor<AAAlign>(IRPosition::value(*II));
if (Ptr) {
A.getOrCreateAAFor<AAAddressSpace>(IRPosition::value(*Ptr));
diff --git a/llvm/lib/Transforms/IPO/AttributorAttributes.cpp b/llvm/lib/Transforms/IPO/AttributorAttributes.cpp
index a6ac7610a2c7a..37ff282343889 100644
--- a/llvm/lib/Transforms/IPO/AttributorAttributes.cpp
+++ b/llvm/lib/Transforms/IPO/AttributorAttributes.cpp
@@ -5279,6 +5279,12 @@ struct AAAlignImpl : AAAlign {
/// See AbstractAttribute::initialize(...).
void initialize(Attributor &A) override {
+ // For make.buffer.rsrc, the alignment strictly equals to the base's
+ // alignment
+ if (Instruction *I = dyn_cast<Instruction>(&getAssociatedValue()))
+ if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(I))
+ if (II->getIntrinsicID() == Intrinsic::amdgcn_make_buffer_rsrc)
+ return;
SmallVector<Attribute, 4> Attrs;
A.getAttrs(getIRPosition(), {Attribute::Alignment}, Attrs);
for (const Attribute &Attr : Attrs)
@@ -5300,10 +5306,19 @@ struct AAAlignImpl : AAAlign {
if (isa<ConstantData>(AssociatedValue))
return ChangeStatus::UNCHANGED;
+ // For use of amdgcn.make.buffer.rsrc, the alignment equals to
+ // min(base, load/store)
+ bool IsMakeBufferRsrc = false;
+ if (Instruction *I = dyn_cast<Instruction>(&getAssociatedValue()))
+ if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(I))
+ if (II->getIntrinsicID() == Intrinsic::amdgcn_make_buffer_rsrc)
+ IsMakeBufferRsrc = true;
for (const Use &U : AssociatedValue.uses()) {
if (auto *SI = dyn_cast<StoreInst>(U.getUser())) {
if (SI->getPointerOperand() == &AssociatedValue)
- if (SI->getAlign() < getAssumedAlign()) {
+ if (IsMakeBufferRsrc) {
+ SI->setAlignment(std::min(SI->getAlign(), getAssumedAlign()));
+ } else if (SI->getAlign() < getAssumedAlign()) {
STATS_DECLTRACK(AAAlign, Store,
"Number of times alignment added to a store");
SI->setAlignment(getAssumedAlign());
@@ -5311,14 +5326,18 @@ struct AAAlignImpl : AAAlign {
}
} else if (auto *LI = dyn_cast<LoadInst>(U.getUser())) {
if (LI->getPointerOperand() == &AssociatedValue)
- if (LI->getAlign() < getAssumedAlign()) {
+ if (IsMakeBufferRsrc) {
+ LI->setAlignment(std::min(LI->getAlign(), getAssumedAlign()));
+ } else if (LI->getAlign() < getAssumedAlign()) {
LI->setAlignment(getAssumedAlign());
STATS_DECLTRACK(AAAlign, Load,
"Number of times alignment added to a load");
InstrChanged = ChangeStatus::CHANGED;
}
} else if (auto *RMW = dyn_cast<AtomicRMWInst>(U.getUser())) {
- if (RMW->getPointerOperand() == &AssociatedValue) {
+ if (IsMakeBufferRsrc) {
+ RMW->setAlignment(std::min(RMW->getAlign(), getAssumedAlign()));
+ } else if (RMW->getPointerOperand() == &AssociatedValue) {
if (RMW->getAlign() < getAssumedAlign()) {
STATS_DECLTRACK(AAAlign, AtomicRMW,
"Number of times alignment added to atomicrmw");
@@ -5328,7 +5347,9 @@ struct AAAlignImpl : AAAlign {
}
}
} else if (auto *CAS = dyn_cast<AtomicCmpXchgInst>(U.getUser())) {
- if (CAS->getPointerOperand() == &AssociatedValue) {
+ if (IsMakeBufferRsrc) {
+ CAS->setAlignment(std::min(CAS->getAlign(), getAssumedAlign()));
+ } else if (CAS->getPointerOperand() == &AssociatedValue) {
if (CAS->getAlign() < getAssumedAlign()) {
STATS_DECLTRACK(AAAlign, AtomicCmpXchg,
"Number of times alignment added to cmpxchg");
@@ -5554,6 +5575,15 @@ struct AAAlignCallSiteReturned final
std::min(this->getAssumedAlign(), Alignment).value());
break;
}
+ case Intrinsic::amdgcn_make_buffer_rsrc: {
+ const auto *AlignAA =
+ A.getAAFor<AAAlign>(*this, IRPosition::value(*(II->getOperand(0))),
+ DepClassTy::REQUIRED);
+ if (AlignAA && AlignAA->isValidState())
+ return clampStateAndIndicateChange<StateType>(
+ this->getState(), AlignAA->getAssumedAlign().value());
+ break;
+ }
default:
break;
}
diff --git a/llvm/test/CodeGen/AMDGPU/attr-amdgpu-align.ll b/llvm/test/CodeGen/AMDGPU/attr-amdgpu-align.ll
new file mode 100644
index 0000000000000..8d2bfab09460b
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/attr-amdgpu-align.ll
@@ -0,0 +1,26 @@
+; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 6
+; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-attributor %s -o - | FileCheck %s
+
+define float @load_gt_base(ptr align 4 %p) {
+; CHECK-LABEL: define float @load_gt_base(
+; CHECK-SAME: ptr align 4 [[P:%.*]]) #[[ATTR0:[0-9]+]] {
+; CHECK-NEXT: [[PTR:%.*]] = call align 4 ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p0(ptr align 4 [[P]], i16 0, i64 0, i32 0)
+; CHECK-NEXT: [[LOADED:%.*]] = load float, ptr addrspace(7) [[PTR]], align 4
+; CHECK-NEXT: ret float [[LOADED]]
+;
+ %ptr = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p0(ptr %p, i16 0, i64 0, i32 0)
+ %loaded = load float, ptr addrspace(7) %ptr, align 8
+ ret float %loaded
+}
+
+define float @load_lt_base(ptr align 8 %p) {
+; CHECK-LABEL: define float @load_lt_base(
+; CHECK-SAME: ptr align 8 [[P:%.*]]) #[[ATTR0]] {
+; CHECK-NEXT: [[PTR:%.*]] = call align 8 ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p0(ptr align 8 [[P]], i16 0, i64 0, i32 0)
+; CHECK-NEXT: [[LOADED:%.*]] = load float, ptr addrspace(7) [[PTR]], align 4
+; CHECK-NEXT: ret float [[LOADED]]
+;
+ %ptr = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p0(ptr %p, i16 0, i64 0, i32 0)
+ %loaded = load float, ptr addrspace(7) %ptr, align 4
+ ret float %loaded
+}
diff --git a/llvm/test/Transforms/Attributor/AMDGPU/tag-invariant-loads.ll b/llvm/test/Transforms/Attributor/AMDGPU/tag-invariant-loads.ll
index 1ab607465dbbb..34bbfa8974747 100644
--- a/llvm/test/Transforms/Attributor/AMDGPU/tag-invariant-loads.ll
+++ b/llvm/test/Transforms/Attributor/AMDGPU/tag-invariant-loads.ll
@@ -306,7 +306,7 @@ define amdgpu_kernel void @test_call_untouched_ptr() {
define amdgpu_kernel void @test_make_buffer(ptr addrspace(1) %ptr) {
; AMDGCN-LABEL: define amdgpu_kernel void @test_make_buffer(
; AMDGCN-SAME: ptr addrspace(1) nofree readonly captures(none) [[PTR:%.*]]) #[[ATTR2]] {
-; AMDGCN-NEXT: [[RSRC:%.*]] = call align 4 ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p1(ptr addrspace(1) [[PTR]], i16 noundef 0, i64 noundef 0, i32 noundef 0) #[[ATTR11:[0-9]+]]
+; AMDGCN-NEXT: [[RSRC:%.*]] = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p1(ptr addrspace(1) [[PTR]], i16 noundef 0, i64 noundef 0, i32 noundef 0) #[[ATTR11:[0-9]+]]
; AMDGCN-NEXT: [[VAL:%.*]] = load i32, ptr addrspace(7) [[RSRC]], align 4
; AMDGCN-NEXT: call void @clobber(i32 [[VAL]]) #[[ATTR7]]
; AMDGCN-NEXT: ret void
@@ -321,7 +321,7 @@ define amdgpu_kernel void @test_make_buffer(ptr addrspace(1) %ptr) {
define amdgpu_kernel void @test_make_buffer_noalias(ptr addrspace(1) noalias %ptr) {
; AMDGCN-LABEL: define amdgpu_kernel void @test_make_buffer_noalias(
; AMDGCN-SAME: ptr addrspace(1) noalias nofree readonly captures(none) [[PTR:%.*]]) #[[ATTR2]] {
-; AMDGCN-NEXT: [[RSRC:%.*]] = call align 4 ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p1(ptr addrspace(1) [[PTR]], i16 noundef 0, i64 noundef 0, i32 noundef 0) #[[ATTR11]]
+; AMDGCN-NEXT: [[RSRC:%.*]] = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p1(ptr addrspace(1) [[PTR]], i16 noundef 0, i64 noundef 0, i32 noundef 0) #[[ATTR11]]
; AMDGCN-NEXT: [[VAL:%.*]] = load i32, ptr addrspace(7) [[RSRC]], align 4, !invariant.load [[META0]]
; AMDGCN-NEXT: call void @clobber(i32 [[VAL]]) #[[ATTR7]]
; AMDGCN-NEXT: ret void
shiltian left a comment:
I don't think we should put handling of AMDGPU-specific code into the generic code. We could create a class in AMDGPUAttributor, inheriting from the existing ones, dedicated to handling AMDGPU-specific stuff.
AMDGPUAttributor isn't really the place for it either. It's not an AMDGPU-specific attribute.
Title should make it clear this is about inferring it, not changing the intrinsic definition.
    const auto *AlignAA =
        A.getAAFor<AAAlign>(*this, IRPosition::value(*(II->getOperand(0))),
                            DepClassTy::REQUIRED);
    if (AlignAA && AlignAA->isValidState())
Does TargetTransformInfo have some kind of alignment propagation already? I thought it did
Hi @arsenm, I had a look but can't be sure. There are lots of alignment-related functions, but they are mainly used for legality checks and cost computation.
I'm not really familiar with the struct; could you be more specific, so that I have some direction to search?
Thanks
It is an AMDGPU-specific intrinsic.
I'd like to flag #167553 as related (and to make sure we're on the same page as to what we mean by `align` here).
    llvm_unreachable("AAAMDGPUClusterDims is only valid for function position");
  }

  struct AAAMDGPUMakeBufferRsrcAlign
I'd make it something like `AAAMDGPUAlign`, and then use it to deal with all AMDGPU-related alignments.
Also, document the new class.
That does not make the transform AMDGPU-specific. This is applying target-intrinsic knowledge to a generic intrinsic. The handling should be directly in AAAlign. I would rank handling it in an AMDGPU-specific Attributor significantly worse than just hardcoding the target intrinsic in AAAlign. Better would be to have TTI handle the relevant parsing.
We probably could use the TTI information from #140802 to get the alignment.
krzysz00 left a comment:
I'm with @arsenm on "this goes in the generic align handling".
Overall, can we see a few more test cases? For example, a load/store that is underaligned, and a function argument with aligns on it.
I'd also like to see (especially after my docs PR lands) a note somewhere in the code that this is a conservatively correct approach to this alignment inference.
The pointer operand could be a function argument or a GEP result or ... anything you can do to a pointer, really. I think the simplest thing to do would be to say that the result of `make.buffer.rsrc` is exactly as aligned as its base pointer operand. Therefore, if I have a base pointer whose alignment is known, the fat pointer built from it can assume that alignment. So I think that adding generic handling for "this returns an existing pointer without capturing" might be the right call.
In the previous PR that handles the `ptrmask` intrinsic …
The one question is: do we want the following

```ll
define float @overaligned(ptr addrspace(1) align(2) inreg %x, i32 inreg %off) {
  %rsrc = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc(%x, ...)
  %spot = getelementptr i8, ptr addrspace(7) %rsrc, i32 %off
  ;;; UB! This load is "align 4" but the base pointer is only known to be aligned to 2.
  ;;; Because both the base and `%off` are workgroup-uniform, this `load` is (though we don't do
  ;;; this atm) promotable to s_buffer_load, where the last two bits of `%x`'s address would be silently
  ;;; dropped.
  %ret = load float, ptr addrspace(7) %spot, align 4, !invariant.load
  ret float %ret
}
```

to just stay as UB, or do we want to fix it to be `align 2`?
The attributor will change the alignment of the load to 2 in this case.
🐧 Linux x64 Test Results
✅ The build succeeded and all tests passed.
        A.getAAFor<AAAlign>(*this, IRPosition::value(*(II->getOperand(0))),
                            DepClassTy::REQUIRED);
-   if (AlignAA && AlignAA->isValidState()) {
+   if (AlignAA) {
not sure about this change
Hi @shiltian, if I'm not wrong, the AAAlign would be invalid if the assumed alignment is 1:

```cpp
/// See AbstractState::isValidState()
/// NOTE: For now we simply pretend that the worst possible state is invalid.
bool isValidState() const override { return Assumed != getWorstState(); }
```

In this case, if the mask is not valid, then the assumed alignment of `ptrmask` should also be 1...
✅ With the latest revision this PR passed the C/C++ code formatter.
        return AlignAA->getKnownAlign().value();
      break;
    }
    case Intrinsic::amdgcn_make_buffer_rsrc: {
Add a comment here regarding the target-specific handling, and some future direction that we might take.
LLVM Buildbot has detected a new failure on a builder. Full details are available at: https://lab.llvm.org/buildbot/#/builders/129/builds/34534
LLVM Buildbot has detected a new failure on a builder. Full details are available at: https://lab.llvm.org/buildbot/#/builders/169/builds/17785
Calculating alignment for the `make.buffer.rsrc` intrinsic. The logic is that the alignment on uses of the return value of `make.buffer.rsrc` should be capped by the alignment of the base operand of `make.buffer.rsrc`.

For example:

```ll
define float @foo(ptr addrspace(1) align X %ptr) {
  %fat.ptr = call ptr addrspace(7) @llvm.amdgcn.make.buffer.rsrc.p7.p1(ptr addrspace(1) %ptr, i16 0, i32 C, i32 0)
  %y = load float, ptr addrspace(7) %fat.ptr, align Y
  ret float %y
}
```

The hope was that `Y = min(X, Y)`.

---

After discussion, it seems improper to let `Y = min(X, Y)`, since that contradicts the semantics of `align` on a load. So we apply the original behavior of align inference instead, which sets both `X` and `Y` to `max(X, Y)`.

---------

Co-authored-by: Shilei Tian <[email protected]>