@@ -1295,8 +1295,7 @@ define amdgpu_ps float @mubuf_atomicrmw_sgpr_ptr_offset4095(ptr addrspace(1) inr
12951295; GFX12-NEXT: v_dual_mov_b32 v0, 2 :: v_dual_mov_b32 v1, 0
12961296; GFX12-NEXT: global_atomic_add_u32 v0, v1, v0, s[2:3] offset:16380 th:TH_ATOMIC_RETURN
12971297; GFX12-NEXT: s_waitcnt vmcnt(0)
1298- ; GFX12-NEXT: buffer_gl0_inv
1299- ; GFX12-NEXT: buffer_gl1_inv
1298+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
13001299; GFX12-NEXT: ; return to shader part epilog
13011300 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4095
13021301 %result = atomicrmw add ptr addrspace (1 ) %gep , i32 2 syncscope("agent" ) seq_cst
@@ -1347,8 +1346,7 @@ define amdgpu_ps float @mubuf_atomicrmw_sgpr_ptr_offset4294967296(ptr addrspace(
13471346; GFX12-NEXT: v_mov_b32_e32 v2, 2
13481347; GFX12-NEXT: global_atomic_add_u32 v0, v[0:1], v2, off th:TH_ATOMIC_RETURN
13491348; GFX12-NEXT: s_waitcnt vmcnt(0)
1350- ; GFX12-NEXT: buffer_gl0_inv
1351- ; GFX12-NEXT: buffer_gl1_inv
1349+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
13521350; GFX12-NEXT: ; return to shader part epilog
13531351 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4294967296
13541352 %result = atomicrmw add ptr addrspace (1 ) %gep , i32 2 syncscope("agent" ) seq_cst
@@ -1389,8 +1387,7 @@ define amdgpu_ps float @mubuf_atomicrmw_vgpr_ptr_offset4095(ptr addrspace(1) %pt
13891387; GFX12-NEXT: v_mov_b32_e32 v2, 2
13901388; GFX12-NEXT: global_atomic_add_u32 v0, v[0:1], v2, off offset:16380 th:TH_ATOMIC_RETURN
13911389; GFX12-NEXT: s_waitcnt vmcnt(0)
1392- ; GFX12-NEXT: buffer_gl0_inv
1393- ; GFX12-NEXT: buffer_gl1_inv
1390+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
13941391; GFX12-NEXT: ; return to shader part epilog
13951392 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4095
13961393 %result = atomicrmw add ptr addrspace (1 ) %gep , i32 2 syncscope("agent" ) seq_cst
@@ -1438,8 +1435,7 @@ define amdgpu_ps float @mubuf_atomicrmw_vgpr_ptr_offset4294967296(ptr addrspace(
14381435; GFX12-NEXT: v_mov_b32_e32 v2, 2
14391436; GFX12-NEXT: global_atomic_add_u32 v0, v[0:1], v2, off th:TH_ATOMIC_RETURN
14401437; GFX12-NEXT: s_waitcnt vmcnt(0)
1441- ; GFX12-NEXT: buffer_gl0_inv
1442- ; GFX12-NEXT: buffer_gl1_inv
1438+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
14431439; GFX12-NEXT: ; return to shader part epilog
14441440 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4294967296
14451441 %result = atomicrmw add ptr addrspace (1 ) %gep , i32 2 syncscope("agent" ) seq_cst
@@ -1491,8 +1487,7 @@ define amdgpu_ps float @mubuf_atomicrmw_sgpr_ptr_vgpr_offset(ptr addrspace(1) in
14911487; GFX12-NEXT: v_add_co_ci_u32_e32 v1, vcc_lo, v3, v1, vcc_lo
14921488; GFX12-NEXT: global_atomic_add_u32 v0, v[0:1], v4, off th:TH_ATOMIC_RETURN
14931489; GFX12-NEXT: s_waitcnt vmcnt(0)
1494- ; GFX12-NEXT: buffer_gl0_inv
1495- ; GFX12-NEXT: buffer_gl1_inv
1490+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
14961491; GFX12-NEXT: ; return to shader part epilog
14971492 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i32 %voffset
14981493 %result = atomicrmw add ptr addrspace (1 ) %gep , i32 2 syncscope("agent" ) seq_cst
@@ -1536,8 +1531,7 @@ define amdgpu_ps float @mubuf_cmpxchg_sgpr_ptr_offset4095(ptr addrspace(1) inreg
15361531; GFX12-NEXT: v_mov_b32_e32 v0, 0
15371532; GFX12-NEXT: global_atomic_cmpswap_b32 v0, v0, v[1:2], s[2:3] offset:16380 th:TH_ATOMIC_RETURN
15381533; GFX12-NEXT: s_waitcnt vmcnt(0)
1539- ; GFX12-NEXT: buffer_gl0_inv
1540- ; GFX12-NEXT: buffer_gl1_inv
1534+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
15411535; GFX12-NEXT: ; return to shader part epilog
15421536 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4095
15431537 %result.struct = cmpxchg ptr addrspace (1 ) %gep , i32 %old , i32 %in syncscope("agent" ) seq_cst seq_cst
@@ -1590,8 +1584,7 @@ define amdgpu_ps float @mubuf_cmpxchg_sgpr_ptr_offset4294967296(ptr addrspace(1)
15901584; GFX12-NEXT: v_dual_mov_b32 v4, s1 :: v_dual_mov_b32 v3, s0
15911585; GFX12-NEXT: global_atomic_cmpswap_b32 v0, v[3:4], v[1:2], off th:TH_ATOMIC_RETURN
15921586; GFX12-NEXT: s_waitcnt vmcnt(0)
1593- ; GFX12-NEXT: buffer_gl0_inv
1594- ; GFX12-NEXT: buffer_gl1_inv
1587+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
15951588; GFX12-NEXT: ; return to shader part epilog
15961589 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4294967296
15971590 %result.struct = cmpxchg ptr addrspace (1 ) %gep , i32 %old , i32 %in syncscope("agent" ) seq_cst seq_cst
@@ -1633,8 +1626,7 @@ define amdgpu_ps float @mubuf_cmpxchg_vgpr_ptr_offset4095(ptr addrspace(1) %ptr,
16331626; GFX12-NEXT: v_mov_b32_e32 v4, v2
16341627; GFX12-NEXT: global_atomic_cmpswap_b32 v0, v[0:1], v[3:4], off offset:16380 th:TH_ATOMIC_RETURN
16351628; GFX12-NEXT: s_waitcnt vmcnt(0)
1636- ; GFX12-NEXT: buffer_gl0_inv
1637- ; GFX12-NEXT: buffer_gl1_inv
1629+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
16381630; GFX12-NEXT: ; return to shader part epilog
16391631 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4095
16401632 %result.struct = cmpxchg ptr addrspace (1 ) %gep , i32 %old , i32 %in syncscope("agent" ) seq_cst seq_cst
@@ -1682,8 +1674,7 @@ define amdgpu_ps float @mubuf_cmpxchg_vgpr_ptr_offset4294967296(ptr addrspace(1)
16821674; GFX12-NEXT: v_add_co_ci_u32_e32 v1, vcc_lo, v1, v6, vcc_lo
16831675; GFX12-NEXT: global_atomic_cmpswap_b32 v0, v[0:1], v[3:4], off th:TH_ATOMIC_RETURN
16841676; GFX12-NEXT: s_waitcnt vmcnt(0)
1685- ; GFX12-NEXT: buffer_gl0_inv
1686- ; GFX12-NEXT: buffer_gl1_inv
1677+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
16871678; GFX12-NEXT: ; return to shader part epilog
16881679 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i64 4294967296
16891680 %result.struct = cmpxchg ptr addrspace (1 ) %gep , i32 %old , i32 %in syncscope("agent" ) seq_cst seq_cst
@@ -1736,8 +1727,7 @@ define amdgpu_ps float @mubuf_cmpxchg_sgpr_ptr_vgpr_offset(ptr addrspace(1) inre
17361727; GFX12-NEXT: v_add_co_ci_u32_e32 v1, vcc_lo, v5, v1, vcc_lo
17371728; GFX12-NEXT: global_atomic_cmpswap_b32 v0, v[0:1], v[2:3], off th:TH_ATOMIC_RETURN
17381729; GFX12-NEXT: s_waitcnt vmcnt(0)
1739- ; GFX12-NEXT: buffer_gl0_inv
1740- ; GFX12-NEXT: buffer_gl1_inv
1730+ ; GFX12-NEXT: global_inv scope:SCOPE_DEV
17411731; GFX12-NEXT: ; return to shader part epilog
17421732 %gep = getelementptr i32 , ptr addrspace (1 ) %ptr , i32 %voffset
17431733 %result.struct = cmpxchg ptr addrspace (1 ) %gep , i32 %old , i32 %in syncscope("agent" ) seq_cst seq_cst
0 commit comments