@@ -626,8 +626,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
626
626
; GFX1164-NEXT: s_waitcnt lgkmcnt(0)
627
627
; GFX1164-NEXT: global_atomic_add_f32 v0, v1, s[0:1]
628
628
; GFX1164-NEXT: .LBB1_4:
629
- ; GFX1164-NEXT: s_nop 0
630
- ; GFX1164-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
631
629
; GFX1164-NEXT: s_endpgm
632
630
;
633
631
; GFX1132-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_align4_unsafe:
@@ -675,8 +673,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
675
673
; GFX1132-NEXT: s_waitcnt lgkmcnt(0)
676
674
; GFX1132-NEXT: global_atomic_add_f32 v0, v1, s[0:1]
677
675
; GFX1132-NEXT: .LBB1_4:
678
- ; GFX1132-NEXT: s_nop 0
679
- ; GFX1132-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
680
676
; GFX1132-NEXT: s_endpgm
681
677
;
682
678
; GFX9-DPP-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_align4_unsafe:
@@ -988,8 +984,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
988
984
; GFX1164-DPP-NEXT: s_waitcnt lgkmcnt(0)
989
985
; GFX1164-DPP-NEXT: global_atomic_add_f32 v4, v0, s[0:1]
990
986
; GFX1164-DPP-NEXT: .LBB1_2:
991
- ; GFX1164-DPP-NEXT: s_nop 0
992
- ; GFX1164-DPP-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
993
987
; GFX1164-DPP-NEXT: s_endpgm
994
988
;
995
989
; GFX1132-DPP-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_align4_unsafe:
@@ -1051,8 +1045,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
1051
1045
; GFX1132-DPP-NEXT: s_waitcnt lgkmcnt(0)
1052
1046
; GFX1132-DPP-NEXT: global_atomic_add_f32 v4, v0, s[0:1]
1053
1047
; GFX1132-DPP-NEXT: .LBB1_2:
1054
- ; GFX1132-DPP-NEXT: s_nop 0
1055
- ; GFX1132-DPP-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
1056
1048
; GFX1132-DPP-NEXT: s_endpgm
1057
1049
%divValue = call float @div.float.value ()
1058
1050
%result = atomicrmw fadd ptr addrspace (1 ) %ptr , float %divValue syncscope("agent" ) monotonic , align 4
@@ -3042,8 +3034,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
3042
3034
; GFX1164-NEXT: s_waitcnt lgkmcnt(0)
3043
3035
; GFX1164-NEXT: global_atomic_add_f32 v0, v1, s[0:1]
3044
3036
; GFX1164-NEXT: .LBB5_4:
3045
- ; GFX1164-NEXT: s_nop 0
3046
- ; GFX1164-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
3047
3037
; GFX1164-NEXT: s_endpgm
3048
3038
;
3049
3039
; GFX1132-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_unsafe:
@@ -3091,8 +3081,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
3091
3081
; GFX1132-NEXT: s_waitcnt lgkmcnt(0)
3092
3082
; GFX1132-NEXT: global_atomic_add_f32 v0, v1, s[0:1]
3093
3083
; GFX1132-NEXT: .LBB5_4:
3094
- ; GFX1132-NEXT: s_nop 0
3095
- ; GFX1132-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
3096
3084
; GFX1132-NEXT: s_endpgm
3097
3085
;
3098
3086
; GFX9-DPP-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_unsafe:
@@ -3404,8 +3392,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
3404
3392
; GFX1164-DPP-NEXT: s_waitcnt lgkmcnt(0)
3405
3393
; GFX1164-DPP-NEXT: global_atomic_add_f32 v4, v0, s[0:1]
3406
3394
; GFX1164-DPP-NEXT: .LBB5_2:
3407
- ; GFX1164-DPP-NEXT: s_nop 0
3408
- ; GFX1164-DPP-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
3409
3395
; GFX1164-DPP-NEXT: s_endpgm
3410
3396
;
3411
3397
; GFX1132-DPP-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_unsafe:
@@ -3467,8 +3453,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
3467
3453
; GFX1132-DPP-NEXT: s_waitcnt lgkmcnt(0)
3468
3454
; GFX1132-DPP-NEXT: global_atomic_add_f32 v4, v0, s[0:1]
3469
3455
; GFX1132-DPP-NEXT: .LBB5_2:
3470
- ; GFX1132-DPP-NEXT: s_nop 0
3471
- ; GFX1132-DPP-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
3472
3456
; GFX1132-DPP-NEXT: s_endpgm
3473
3457
%divValue = call float @div.float.value ()
3474
3458
%result = atomicrmw fadd ptr addrspace (1 ) %ptr , float %divValue syncscope("agent" ) monotonic
@@ -3770,8 +3754,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
3770
3754
; GFX1164-NEXT: s_waitcnt lgkmcnt(0)
3771
3755
; GFX1164-NEXT: global_atomic_add_f32 v0, v1, s[0:1]
3772
3756
; GFX1164-NEXT: .LBB6_4:
3773
- ; GFX1164-NEXT: s_nop 0
3774
- ; GFX1164-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
3775
3757
; GFX1164-NEXT: s_endpgm
3776
3758
;
3777
3759
; GFX1132-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_unsafe_structfp:
@@ -3819,8 +3801,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
3819
3801
; GFX1132-NEXT: s_waitcnt lgkmcnt(0)
3820
3802
; GFX1132-NEXT: global_atomic_add_f32 v0, v1, s[0:1]
3821
3803
; GFX1132-NEXT: .LBB6_4:
3822
- ; GFX1132-NEXT: s_nop 0
3823
- ; GFX1132-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
3824
3804
; GFX1132-NEXT: s_endpgm
3825
3805
;
3826
3806
; GFX9-DPP-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_unsafe_structfp:
@@ -4132,8 +4112,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
4132
4112
; GFX1164-DPP-NEXT: s_waitcnt lgkmcnt(0)
4133
4113
; GFX1164-DPP-NEXT: global_atomic_add_f32 v4, v0, s[0:1]
4134
4114
; GFX1164-DPP-NEXT: .LBB6_2:
4135
- ; GFX1164-DPP-NEXT: s_nop 0
4136
- ; GFX1164-DPP-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
4137
4115
; GFX1164-DPP-NEXT: s_endpgm
4138
4116
;
4139
4117
; GFX1132-DPP-LABEL: global_atomic_fadd_uni_address_div_value_agent_scope_unsafe_structfp:
@@ -4195,8 +4173,6 @@ define amdgpu_kernel void @global_atomic_fadd_uni_address_div_value_agent_scope_
4195
4173
; GFX1132-DPP-NEXT: s_waitcnt lgkmcnt(0)
4196
4174
; GFX1132-DPP-NEXT: global_atomic_add_f32 v4, v0, s[0:1]
4197
4175
; GFX1132-DPP-NEXT: .LBB6_2:
4198
- ; GFX1132-DPP-NEXT: s_nop 0
4199
- ; GFX1132-DPP-NEXT: s_sendmsg sendmsg(MSG_DEALLOC_VGPRS)
4200
4176
; GFX1132-DPP-NEXT: s_endpgm
4201
4177
%divValue = call float @div.float.value ()
4202
4178
%result = atomicrmw fadd ptr addrspace (1 ) %ptr , float %divValue syncscope("agent" ) monotonic
0 commit comments