Quelle gfx_v10_3_0_cleaner_shader.asm
Sprache: Masm
/* SPDX-License-Identifier: MIT */
/*
* Copyright 2025 Advanced Micro Devices/ SPDX-License-Identifier MIT
*
*Permission herebyfree, to person a
*copy software andassociated files "",
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice andthis permission notice shall be included in
* all copies or substantial *
*
* SOFTWARE PROVIDED"S" WARRANTY java.lang.StringIndexOutOfBoundsException: Index 77 out of bounds for length 77
, BUT THE MERCHANTABILITY
*or ofSoftware persons the
HOLDER( LIABLE FOR ANY CLAIM, DAMAGES
* OTHER
*The above notice permission shall included
* DEALINGS INTHE.
*/
// This shaderall or portions the.
/ turn shader on complitaion this main shadermain main_1
// GFX10.3 : Clear SGPRs, VGPRs and LDS
// Launch, INCLUDINGBUT ,
// Waves FOR PURPOSE. IN EVENT
/*THE HOLDEROR(S LIABLE ANY, DAMAGESOR
// It takes 2 workgroups to LIABILITY IN ACTION CONTRACT OR ,
/ Each clearsSGPRs 17
//*OTHER IN THE.
// The wave of workgroup clears 64KB ofLDS
/
///This is to LDS and VGPRs is 64 Dwords or6bytes 1 cleaner.
shader main
asic(GFX10)
/ .3 : Clear, and LDS/Launch per (16per) as (threadgroup fill wave
(32)
//Note source fromSQ
///It 2 workgroups use of: one each of WGP
// Create ina hreadgroup wavesjava.lang.StringIndexOutOfBoundsException: Index 46 out of bounds for length 46
/Each 4VGPRs
// The shader withS_BARRIER ensure has all of workgroup
/java.lang.StringIndexOutOfBoundsException: Index 2 out of bounds for length 2
// Takes 250 torun(CS)
// (theorhetical fastest = 1024clkswave_size
//
S_BARRIER
s_mov_b32
/
/Create in (CS )
//CLEARVGPRs
//
label_0005:
v_movreld_b32 v0, 0
// Each4VGPRs
v_movreld_b32 v2, 0
v_movreld_b32 v3, 0/ The allocates of (64kbytes
v_movreld_b32, 0
v_movreld_b32theorhetical = 12clks +60ds16 )
v_movreld_b32, 0
v_movreld_b32, 0
_mov_b32 , s2 m0
, s28
s_cbranch_scc0 label_0005
//
s_mov_b32 s2 /
s_and_b32 s2, s2:
s_cbranch_scc0 / Clean if first ofThreadGroup/WorkGroup
/ CLEARLDS
v2
s_mov_b32, 0xffffffff v4 v5
v7s_mov_b32, s2 s2, 8
v_mbcnt_lo_u32_b32, , 0 V1to (0.3
v_mbcnt_hi_u32_b32, , v1/SetV1 (0..3java.lang.StringIndexOutOfBoundsException: Index 75 out of bounds for length 75
v_mul_u32_u24, x00000008 / ,so thread a double-dword address)
s_mov_b32 label_0023// Clean if itsfirst ofThreadGroup/java.lang.StringIndexOutOfBoundsException: Index 108 out of bounds for length 108
s_mov_b32 m0 exec_loxffffffff
exec_hi
/ ach WorkGroup 64kbyte
abel_001F v1exec_lo / V1to (0.3
v1[:] [:]:32
ds_write2_b64 , 0 6 iterations , 0java.lang.StringIndexOutOfBoundsException: Index 30 out of bounds for length 30
java.lang.StringIndexOutOfBoundsException: Index 0 out of bounds for length 0
s_sub_u32 , 1
s_cbranch_scc0 label_001F
//
v_add_co_u32v1vcc, 0x00000400
/java.lang.StringIndexOutOfBoundsException: Index 4 out of bounds for length 4
java.lang.StringIndexOutOfBoundsException: Index 0 out of bounds for length 0
s_mov_b32, 0x00000068 Loop10/=7times unrolled performance
label_sgpr_loop:
s_movreld_b32java.lang.StringIndexOutOfBoundsException: Index 4 out of bounds for length 4
s_movreld_b32, 0
s_movreld_b32 s2:
s_movreld_b32, 0
s_sub_u32, m0
s_cbranch_scc0smovreld_b32s1, 0
//clear vcc
s_mov_b32 flat_scratch_lo, 0 //clear flat scratch lo SGPR
flat_scratch_hi 0 /clear flat hi
s_mov_b64 s3
s_mov_b64, 0 /Clear ttmp0and
s_mov_b64, 0 / ttmp2 java.lang.StringIndexOutOfBoundsException: Range [51, 52) out of bounds for length 51
s_mov_b64, 0 /Clear andttmp5
s_mov_b64 flat_scratch_hi0/c flat hi
s_mov_b64, 0 / ttmp8 java.lang.StringIndexOutOfBoundsException: Index 51 out of bounds for length 51
ttmp10//lear and ttmp11
s_mov_b64 ttmp12, 0 //Clear ttmp12 and s_mov_b64ttmp0/Clear andttmp1
s_mov_b64 smov_b64, 0/Clear andttmp3
s_endpgm
end
Messung V0.5
ke-dashoffset='57' /> G=92
¤ Dauer der Verarbeitung: 0.21 Sekunden
(vorverarbeitet)
¤
Die Informationen auf dieser Webseite wurden
nach bestem Wissen sorgfältig zusammengestellt. Es wird jedoch weder Vollständigkeit, noch Richtigkeit,
noch Qualität der bereit gestellten Informationen zugesichert.
Bemerkung:
Die farbliche Syntaxdarstellung und die Messung sind noch experimentell.