Skip to content

Commit 14967a2

Browse files
committed
Remove TempVgprCount to reduce the risk of regression
1 parent 94cf7e4 commit 14967a2

1 file changed

Lines changed: 2 additions & 4 deletions

File tree

include/ck/tensor_operation/gpu/grid/gridwise_gemm_wmma_cshuffle_v3.hpp

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -579,19 +579,17 @@ struct GridwiseGemm_wmma_cshuffle_v3
579579
NPerBlock * KPerBlock / NWave / WaveSize * sizeof(ComputeTypeB) / sizeof(uint32_t);
580580
// WMMA input is duplicated in GFX11
581581
constexpr index_t InputVgprCount = IsGfx11 ? BaseInputVgprCount * 2 : BaseInputVgprCount;
582-
// VGPR used in buffer load and LDS store
583-
constexpr index_t TempVgprCount = BaseInputVgprCount / 2;
584582
// VGPR used in Accumulator
585583
constexpr index_t AccVgprCount =
586584
MPerBlock * NPerBlock / BlockSize * sizeof(AccDataType) / sizeof(uint32_t);
587585

588586
if constexpr(BlkGemmPipelineVer == BlockGemmPipelineVersion::v1)
589587
{
590-
return InputVgprCount + TempVgprCount + AccVgprCount;
588+
return InputVgprCount + AccVgprCount;
591589
}
592590
else if constexpr(BlkGemmPipelineVer == BlockGemmPipelineVersion::v3)
593591
{
594-
return InputVgprCount * 2 + TempVgprCount + AccVgprCount;
592+
return InputVgprCount * 2 + AccVgprCount;
595593
}
596594
else
597595
{

0 commit comments

Comments (0)