@@ -3563,15 +3563,19 @@ define amdgpu_kernel void @global_zextload_v64i16_to_v64i32(ptr addrspace(1) %ou
35633563; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[16:19], off, s[0:3], 0 offset:32 
35643564; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[23:26], off, s[0:3], 0 offset:48 
35653565; GCN-NOHSA-SI-NEXT:    buffer_load_dword v0, off, s[12:15], 0 offset:16 ; 4-byte Folded Reload 
3566+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
35663567; GCN-NOHSA-SI-NEXT:    buffer_load_dword v1, off, s[12:15], 0 offset:20 ; 4-byte Folded Reload 
35673568; GCN-NOHSA-SI-NEXT:    buffer_load_dword v2, off, s[12:15], 0 offset:24 ; 4-byte Folded Reload 
3569+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
35683570; GCN-NOHSA-SI-NEXT:    buffer_load_dword v3, off, s[12:15], 0 offset:28 ; 4-byte Folded Reload 
35693571; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
35703572; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[0:3], off, s[0:3], 0 
35713573; GCN-NOHSA-SI-NEXT:    s_waitcnt expcnt(0) 
35723574; GCN-NOHSA-SI-NEXT:    buffer_load_dword v0, off, s[12:15], 0 ; 4-byte Folded Reload 
3575+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
35733576; GCN-NOHSA-SI-NEXT:    buffer_load_dword v1, off, s[12:15], 0 offset:4 ; 4-byte Folded Reload 
35743577; GCN-NOHSA-SI-NEXT:    buffer_load_dword v2, off, s[12:15], 0 offset:8 ; 4-byte Folded Reload 
3578+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
35753579; GCN-NOHSA-SI-NEXT:    buffer_load_dword v3, off, s[12:15], 0 offset:12 ; 4-byte Folded Reload 
35763580; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
35773581; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[0:3], off, s[0:3], 0 offset:16 
@@ -4371,8 +4375,10 @@ define amdgpu_kernel void @global_sextload_v64i16_to_v64i32(ptr addrspace(1) %ou
43714375; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[8:11], off, s[0:3], 0 offset:48 
43724376; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[4:7], off, s[0:3], 0 
43734377; GCN-NOHSA-SI-NEXT:    buffer_load_dword v0, off, s[12:15], 0 ; 4-byte Folded Reload 
4378+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
43744379; GCN-NOHSA-SI-NEXT:    buffer_load_dword v1, off, s[12:15], 0 offset:4 ; 4-byte Folded Reload 
43754380; GCN-NOHSA-SI-NEXT:    buffer_load_dword v2, off, s[12:15], 0 offset:8 ; 4-byte Folded Reload 
4381+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
43764382; GCN-NOHSA-SI-NEXT:    buffer_load_dword v3, off, s[12:15], 0 offset:12 ; 4-byte Folded Reload 
43774383; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
43784384; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[0:3], off, s[0:3], 0 offset:16 
@@ -7341,8 +7347,10 @@ define amdgpu_kernel void @global_zextload_v32i16_to_v32i64(ptr addrspace(1) %ou
73417347; GCN-NOHSA-SI-NEXT:    buffer_store_dword v15, off, s[12:15], 0 offset:28 ; 4-byte Folded Spill 
73427348; GCN-NOHSA-SI-NEXT:    s_waitcnt expcnt(0) 
73437349; GCN-NOHSA-SI-NEXT:    buffer_load_dword v12, off, s[12:15], 0 ; 4-byte Folded Reload 
7350+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
73447351; GCN-NOHSA-SI-NEXT:    buffer_load_dword v13, off, s[12:15], 0 offset:4 ; 4-byte Folded Reload 
73457352; GCN-NOHSA-SI-NEXT:    buffer_load_dword v14, off, s[12:15], 0 offset:8 ; 4-byte Folded Reload 
7353+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
73467354; GCN-NOHSA-SI-NEXT:    buffer_load_dword v15, off, s[12:15], 0 offset:12 ; 4-byte Folded Reload 
73477355; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
73487356; GCN-NOHSA-SI-NEXT:    v_mov_b32_e32 v13, v39 
@@ -7364,8 +7372,10 @@ define amdgpu_kernel void @global_zextload_v32i16_to_v32i64(ptr addrspace(1) %ou
73647372; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[4:7], off, s[0:3], 0 offset:96 
73657373; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[8:11], off, s[0:3], 0 offset:64 
73667374; GCN-NOHSA-SI-NEXT:    buffer_load_dword v0, off, s[12:15], 0 offset:16 ; 4-byte Folded Reload 
7375+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
73677376; GCN-NOHSA-SI-NEXT:    buffer_load_dword v1, off, s[12:15], 0 offset:20 ; 4-byte Folded Reload 
73687377; GCN-NOHSA-SI-NEXT:    buffer_load_dword v2, off, s[12:15], 0 offset:24 ; 4-byte Folded Reload 
7378+ ; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
73697379; GCN-NOHSA-SI-NEXT:    buffer_load_dword v3, off, s[12:15], 0 offset:28 ; 4-byte Folded Reload 
73707380; GCN-NOHSA-SI-NEXT:    s_waitcnt vmcnt(0) 
73717381; GCN-NOHSA-SI-NEXT:    buffer_store_dwordx4 v[0:3], off, s[0:3], 0 offset:32 
0 commit comments