File tree: include/ck/tensor_operation/gpu/grid
Columns: original file line number | diff line number | diff line change
@@ -579,19 +579,17 @@ struct GridwiseGemm_wmma_cshuffle_v3
579579 NPerBlock * KPerBlock / NWave / WaveSize * sizeof (ComputeTypeB) / sizeof (uint32_t );
580580 // WMMA input is duplicated in GFX11
581581 constexpr index_t InputVgprCount = IsGfx11 ? BaseInputVgprCount * 2 : BaseInputVgprCount;
582- // VGPR used in buffer load and LDS store
583- constexpr index_t TempVgprCount = BaseInputVgprCount / 2 ;
584582 // VGPR used in Accumulator
585583 constexpr index_t AccVgprCount =
586584 MPerBlock * NPerBlock / BlockSize * sizeof (AccDataType) / sizeof (uint32_t );
587585
588586 if constexpr (BlkGemmPipelineVer == BlockGemmPipelineVersion::v1)
589587 {
590- return InputVgprCount + TempVgprCount + AccVgprCount;
588+ return InputVgprCount + AccVgprCount;
591589 }
592590 else if constexpr (BlkGemmPipelineVer == BlockGemmPipelineVersion::v3)
593591 {
594- return InputVgprCount * 2 + TempVgprCount + AccVgprCount;
592+ return InputVgprCount * 2 + AccVgprCount;
595593 }
596594 else
597595 {
You can’t perform that action at this time.
0 commit comments