Mercurial > hg > CbC > CbC_llvm
view llvm/test/CodeGen/AMDGPU/local-stack-slot-offset.ll @ 266:00f31e85ec16 default tip
Added tag current for changeset 31d058e83c98
author | Shinji KONO <kono@ie.u-ryukyu.ac.jp> |
---|---|
date | Sat, 14 Oct 2023 10:13:55 +0900 |
parents | 1f2b6ac9f198 |
children |
line wrap: on
line source
;RUN: llc < %s -march=amdgcn -mcpu=verde -mattr=-promote-alloca -verify-machineinstrs | FileCheck %s -check-prefix=CHECK ;RUN: llc < %s -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -mattr=-promote-alloca -verify-machineinstrs | FileCheck %s -check-prefix=CHECK ; Allocate two stack slots of 2052 bytes each requiring a total of 4104 bytes. ; Extracting the last element of each does not fit into the offset field of ; MUBUF instructions, so a new base register is needed. This used to not ; happen, leading to an assertion. ; CHECK-LABEL: {{^}}main: ; CHECK: buffer_store_dword ; CHECK: buffer_store_dword ; CHECK: buffer_load_dword ; CHECK: buffer_load_dword define amdgpu_gs float @main(float %v1, float %v2, i32 %idx1, i32 %idx2) { main_body: %m1 = alloca [513 x float], addrspace(5) %m2 = alloca [513 x float], addrspace(5) %gep1.store = getelementptr [513 x float], ptr addrspace(5) %m1, i32 0, i32 %idx1 store float %v1, ptr addrspace(5) %gep1.store %gep2.store = getelementptr [513 x float], ptr addrspace(5) %m2, i32 0, i32 %idx2 store float %v2, ptr addrspace(5) %gep2.store ; This used to use a base reg equal to 0. %out1 = load float, ptr addrspace(5) %m1 ; This used to attempt to re-use the base reg at 0, generating an out-of-bounds instruction offset. %gep2.load = getelementptr [513 x float], ptr addrspace(5) %m2, i32 0, i32 512 %out2 = load float, ptr addrspace(5) %gep2.load %r = fadd float %out1, %out2 ret float %r }