@@ -777,117 +777,57 @@ define amdgpu_gfx void @test_call_void_func_void_preserves_v40(ptr addrspace(1)
777
777
ret void
778
778
}
779
779
780
; void_func_void_clobber_s33: the IR body is one inline-asm statement that
; lists s33 as clobbered, followed by `ret void`.
; In this hunk the definition gains the amdgpu_gfx calling convention, and for
; all three check prefixes the expected output drops the v0 spill/reload and the
; v_writelane_b32 / v_readlane_b32 pair that previously bracketed the asm, so
; only the entry s_waitcnt, the asm markers and s_setpc_b64 remain.
- define hidden void @void_func_void_clobber_s33 () #1 {
780
+ define hidden amdgpu_gfx void @void_func_void_clobber_s33 () #1 {
781
781
; GFX9-LABEL: void_func_void_clobber_s33:
782
782
; GFX9: ; %bb.0:
783
783
; GFX9-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
784
- ; GFX9-NEXT: s_xor_saveexec_b64 s[4:5], -1
785
- ; GFX9-NEXT: buffer_store_dword v0, off, s[0:3], s32 ; 4-byte Folded Spill
786
- ; GFX9-NEXT: s_mov_b64 exec, s[4:5]
787
- ; GFX9-NEXT: v_writelane_b32 v0, s33, 0
788
784
; GFX9-NEXT: ;;#ASMSTART
789
785
; GFX9-NEXT: ; clobber
790
786
; GFX9-NEXT: ;;#ASMEND
791
- ; GFX9-NEXT: v_readlane_b32 s33, v0, 0
792
- ; GFX9-NEXT: s_xor_saveexec_b64 s[4:5], -1
793
- ; GFX9-NEXT: buffer_load_dword v0, off, s[0:3], s32 ; 4-byte Folded Reload
794
- ; GFX9-NEXT: s_mov_b64 exec, s[4:5]
795
- ; GFX9-NEXT: s_waitcnt vmcnt(0)
796
787
; GFX9-NEXT: s_setpc_b64 s[30:31]
797
788
;
798
789
; GFX10-LABEL: void_func_void_clobber_s33:
799
790
; GFX10: ; %bb.0:
800
791
; GFX10-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
801
- ; GFX10-NEXT: s_xor_saveexec_b32 s4, -1
802
- ; GFX10-NEXT: buffer_store_dword v0, off, s[0:3], s32 ; 4-byte Folded Spill
803
- ; GFX10-NEXT: s_waitcnt_depctr 0xffe3
804
- ; GFX10-NEXT: s_mov_b32 exec_lo, s4
805
- ; GFX10-NEXT: v_writelane_b32 v0, s33, 0
806
792
; GFX10-NEXT: ;;#ASMSTART
807
793
; GFX10-NEXT: ; clobber
808
794
; GFX10-NEXT: ;;#ASMEND
809
- ; GFX10-NEXT: v_readlane_b32 s33, v0, 0
810
- ; GFX10-NEXT: s_xor_saveexec_b32 s4, -1
811
- ; GFX10-NEXT: buffer_load_dword v0, off, s[0:3], s32 ; 4-byte Folded Reload
812
- ; GFX10-NEXT: s_waitcnt_depctr 0xffe3
813
- ; GFX10-NEXT: s_mov_b32 exec_lo, s4
814
- ; GFX10-NEXT: s_waitcnt vmcnt(0)
815
795
; GFX10-NEXT: s_setpc_b64 s[30:31]
816
796
;
817
797
; GFX11-LABEL: void_func_void_clobber_s33:
818
798
; GFX11: ; %bb.0:
819
799
; GFX11-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
820
- ; GFX11-NEXT: s_xor_saveexec_b32 s0, -1
821
- ; GFX11-NEXT: scratch_store_b32 off, v0, s32 ; 4-byte Folded Spill
822
- ; GFX11-NEXT: s_mov_b32 exec_lo, s0
823
- ; GFX11-NEXT: v_writelane_b32 v0, s33, 0
824
800
; GFX11-NEXT: ;;#ASMSTART
825
801
; GFX11-NEXT: ; clobber
826
802
; GFX11-NEXT: ;;#ASMEND
827
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1)
828
- ; GFX11-NEXT: v_readlane_b32 s33, v0, 0
829
- ; GFX11-NEXT: s_xor_saveexec_b32 s0, -1
830
- ; GFX11-NEXT: scratch_load_b32 v0, off, s32 ; 4-byte Folded Reload
831
- ; GFX11-NEXT: s_mov_b32 exec_lo, s0
832
- ; GFX11-NEXT: s_waitcnt vmcnt(0)
833
803
; GFX11-NEXT: s_setpc_b64 s[30:31]
834
804
; The asm text is only a comment; the "~{s33}" constraint is what marks s33
; as clobbered by this statement.
call void asm sideeffect "; clobber" , "~{s33}" () #0
835
805
ret void
836
806
}
837
807
838
- define hidden void @void_func_void_clobber_s34 () #1 {
808
+ define hidden amdgpu_gfx void @void_func_void_clobber_s34 () #1 {
839
809
; GFX9-LABEL: void_func_void_clobber_s34:
840
810
; GFX9: ; %bb.0:
841
811
; GFX9-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
842
- ; GFX9-NEXT: s_xor_saveexec_b64 s[4:5], -1
843
- ; GFX9-NEXT: buffer_store_dword v0, off, s[0:3], s32 ; 4-byte Folded Spill
844
- ; GFX9-NEXT: s_mov_b64 exec, s[4:5]
845
- ; GFX9-NEXT: v_writelane_b32 v0, s34, 0
846
812
; GFX9-NEXT: ;;#ASMSTART
847
813
; GFX9-NEXT: ; clobber
848
814
; GFX9-NEXT: ;;#ASMEND
849
- ; GFX9-NEXT: v_readlane_b32 s34, v0, 0
850
- ; GFX9-NEXT: s_xor_saveexec_b64 s[4:5], -1
851
- ; GFX9-NEXT: buffer_load_dword v0, off, s[0:3], s32 ; 4-byte Folded Reload
852
- ; GFX9-NEXT: s_mov_b64 exec, s[4:5]
853
- ; GFX9-NEXT: s_waitcnt vmcnt(0)
854
815
; GFX9-NEXT: s_setpc_b64 s[30:31]
855
816
;
856
817
; GFX10-LABEL: void_func_void_clobber_s34:
857
818
; GFX10: ; %bb.0:
858
819
; GFX10-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
859
- ; GFX10-NEXT: s_xor_saveexec_b32 s4, -1
860
- ; GFX10-NEXT: buffer_store_dword v0, off, s[0:3], s32 ; 4-byte Folded Spill
861
- ; GFX10-NEXT: s_waitcnt_depctr 0xffe3
862
- ; GFX10-NEXT: s_mov_b32 exec_lo, s4
863
- ; GFX10-NEXT: v_writelane_b32 v0, s34, 0
864
820
; GFX10-NEXT: ;;#ASMSTART
865
821
; GFX10-NEXT: ; clobber
866
822
; GFX10-NEXT: ;;#ASMEND
867
- ; GFX10-NEXT: v_readlane_b32 s34, v0, 0
868
- ; GFX10-NEXT: s_xor_saveexec_b32 s4, -1
869
- ; GFX10-NEXT: buffer_load_dword v0, off, s[0:3], s32 ; 4-byte Folded Reload
870
- ; GFX10-NEXT: s_waitcnt_depctr 0xffe3
871
- ; GFX10-NEXT: s_mov_b32 exec_lo, s4
872
- ; GFX10-NEXT: s_waitcnt vmcnt(0)
873
823
; GFX10-NEXT: s_setpc_b64 s[30:31]
874
824
;
875
825
; GFX11-LABEL: void_func_void_clobber_s34:
876
826
; GFX11: ; %bb.0:
877
827
; GFX11-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
878
- ; GFX11-NEXT: s_xor_saveexec_b32 s0, -1
879
- ; GFX11-NEXT: scratch_store_b32 off, v0, s32 ; 4-byte Folded Spill
880
- ; GFX11-NEXT: s_mov_b32 exec_lo, s0
881
- ; GFX11-NEXT: v_writelane_b32 v0, s34, 0
882
828
; GFX11-NEXT: ;;#ASMSTART
883
829
; GFX11-NEXT: ; clobber
884
830
; GFX11-NEXT: ;;#ASMEND
885
- ; GFX11-NEXT: s_delay_alu instid0(VALU_DEP_1)
886
- ; GFX11-NEXT: v_readlane_b32 s34, v0, 0
887
- ; GFX11-NEXT: s_xor_saveexec_b32 s0, -1
888
- ; GFX11-NEXT: scratch_load_b32 v0, off, s32 ; 4-byte Folded Reload
889
- ; GFX11-NEXT: s_mov_b32 exec_lo, s0
890
- ; GFX11-NEXT: s_waitcnt vmcnt(0)
891
831
; GFX11-NEXT: s_setpc_b64 s[30:31]
892
832
call void asm sideeffect "; clobber" , "~{s34}" () #0
893
833
ret void
0 commit comments