@@ -430,36 +430,36 @@ define ptr @gep_disjoint_or(ptr %base) {
430
430
431
431
; Check that AssertAlign nodes between ptradd nodes don't block offset folding,
432
432
; taken from preload-implicit-kernargs.ll
433
- define amdgpu_kernel void @random_incorrect_offset (ptr addrspace (1 ) inreg %out ) # 0 {
433
+ define amdgpu_kernel void @random_incorrect_offset (ptr addrspace (1 ) inreg %out ) {
434
434
; GFX942_PTRADD-LABEL: random_incorrect_offset:
435
435
; GFX942_PTRADD: ; %bb.1:
436
- ; GFX942_PTRADD-NEXT: s_load_dwordx2 s[2:3 ], s[0:1 ], 0x0
436
+ ; GFX942_PTRADD-NEXT: s_load_dwordx2 s[8:9 ], s[4:5 ], 0x0
437
437
; GFX942_PTRADD-NEXT: s_waitcnt lgkmcnt(0)
438
438
; GFX942_PTRADD-NEXT: s_branch .LBB21_0
439
439
; GFX942_PTRADD-NEXT: .p2align 8
440
440
; GFX942_PTRADD-NEXT: ; %bb.2:
441
441
; GFX942_PTRADD-NEXT: .LBB21_0:
442
- ; GFX942_PTRADD-NEXT: s_load_dword s0, s[0:1 ], 0xa
442
+ ; GFX942_PTRADD-NEXT: s_load_dword s0, s[4:5 ], 0xa
443
443
; GFX942_PTRADD-NEXT: v_mov_b32_e32 v0, 0
444
444
; GFX942_PTRADD-NEXT: s_waitcnt lgkmcnt(0)
445
445
; GFX942_PTRADD-NEXT: v_mov_b32_e32 v1, s0
446
- ; GFX942_PTRADD-NEXT: global_store_dword v0, v1, s[2:3 ]
446
+ ; GFX942_PTRADD-NEXT: global_store_dword v0, v1, s[8:9 ]
447
447
; GFX942_PTRADD-NEXT: s_endpgm
448
448
;
449
449
; GFX942_LEGACY-LABEL: random_incorrect_offset:
450
450
; GFX942_LEGACY: ; %bb.1:
451
- ; GFX942_LEGACY-NEXT: s_load_dwordx2 s[2:3 ], s[0:1 ], 0x0
451
+ ; GFX942_LEGACY-NEXT: s_load_dwordx2 s[8:9 ], s[4:5 ], 0x0
452
452
; GFX942_LEGACY-NEXT: s_waitcnt lgkmcnt(0)
453
453
; GFX942_LEGACY-NEXT: s_branch .LBB21_0
454
454
; GFX942_LEGACY-NEXT: .p2align 8
455
455
; GFX942_LEGACY-NEXT: ; %bb.2:
456
456
; GFX942_LEGACY-NEXT: .LBB21_0:
457
- ; GFX942_LEGACY-NEXT: s_mov_b32 s4 , 8
458
- ; GFX942_LEGACY-NEXT: s_load_dword s0, s[0:1 ], s4 offset:0x2
457
+ ; GFX942_LEGACY-NEXT: s_mov_b32 s0 , 8
458
+ ; GFX942_LEGACY-NEXT: s_load_dword s0, s[4:5 ], s0 offset:0x2
459
459
; GFX942_LEGACY-NEXT: v_mov_b32_e32 v0, 0
460
460
; GFX942_LEGACY-NEXT: s_waitcnt lgkmcnt(0)
461
461
; GFX942_LEGACY-NEXT: v_mov_b32_e32 v1, s0
462
- ; GFX942_LEGACY-NEXT: global_store_dword v0, v1, s[2:3 ]
462
+ ; GFX942_LEGACY-NEXT: global_store_dword v0, v1, s[8:9 ]
463
463
; GFX942_LEGACY-NEXT: s_endpgm
464
464
%imp_arg_ptr = call ptr addrspace (4 ) @llvm.amdgcn.implicitarg.ptr ()
465
465
%gep = getelementptr i8 , ptr addrspace (4 ) %imp_arg_ptr , i32 2
@@ -471,5 +471,3 @@ define amdgpu_kernel void @random_incorrect_offset(ptr addrspace(1) inreg %out)
471
471
declare void @llvm.memcpy.p0.p4.i64 (ptr noalias nocapture writeonly , ptr addrspace (4 ) noalias nocapture readonly , i64 , i1 immarg)
472
472
473
473
!0 = !{}
474
-
475
- attributes #0 = { "amdgpu-agpr-alloc" ="0" "amdgpu-no-completion-action" "amdgpu-no-default-queue" "amdgpu-no-dispatch-id" "amdgpu-no-dispatch-ptr" "amdgpu-no-heap-ptr" "amdgpu-no-hostcall-ptr" "amdgpu-no-lds-kernel-id" "amdgpu-no-multigrid-sync-arg" "amdgpu-no-queue-ptr" "amdgpu-no-workgroup-id-x" "amdgpu-no-workgroup-id-y" "amdgpu-no-workgroup-id-z" "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "uniform-work-group-size" ="false" }
0 commit comments